├── .github
    ├── renovate.json5
    └── workflows
    │   ├── codeflash.yml
    │   ├── publish.yml
    │   └── tests.yml
├── .gitignore
├── .mailmap
├── .pre-commit-config.yaml
├── .python-version
├── .secrets.allowlist
├── CITATION.cff
├── LICENSE
├── README.md
├── citation.bib
├── docs
    └── assets
    │   ├── Aviary.png
    │   ├── ldp_chessboard.png
    │   └── ldp_definition.png
├── packages
    └── lmi
    │   ├── LICENSE
    │   ├── README.md
    │   ├── pyproject.toml
    │   ├── src
    │       └── lmi
    │       │   ├── __init__.py
    │       │   ├── constants.py
    │       │   ├── cost_tracker.py
    │       │   ├── embeddings.py
    │       │   ├── exceptions.py
    │       │   ├── llms.py
    │       │   ├── py.typed
    │       │   ├── rate_limiter.py
    │       │   ├── types.py
    │       │   └── utils.py
    │   └── tests
    │       ├── __init__.py
    │       ├── cassettes
    │           ├── TestLiteLLMEmbeddingModel.test_caching.yaml
    │           ├── TestLiteLLMModel.test_call[Anthropic-model].yaml
    │           ├── TestLiteLLMModel.test_call[OpenAI-model].yaml
    │           ├── TestLiteLLMModel.test_call[chat-model].yaml
    │           ├── TestLiteLLMModel.test_call[completion-model].yaml
    │           ├── TestLiteLLMModel.test_call_single[with-router].yaml
    │           ├── TestLiteLLMModel.test_call_single[without-router].yaml
    │           ├── TestLiteLLMModel.test_call_w_figure.yaml
    │           ├── TestLiteLLMModel.test_call_w_multiple_models[multiple-models].yaml
    │           ├── TestLiteLLMModel.test_call_with_prompt[with-router].yaml
    │           ├── TestLiteLLMModel.test_call_with_prompt[without-router].yaml
    │           ├── TestLiteLLMModel.test_cost_call[Anthropic-model].yaml
    │           ├── TestLiteLLMModel.test_cost_call[OpenAI-model].yaml
    │           ├── TestLiteLLMModel.test_cost_call_single[with-router].yaml
    │           ├── TestLiteLLMModel.test_cost_call_single[without-router].yaml
    │           ├── TestLiteLLMModel.test_max_token_truncation[with-router].yaml
    │           ├── TestLiteLLMModel.test_max_token_truncation[without-router].yaml
    │           ├── TestLiteLLMModel.test_run_prompt[with-router].yaml
    │           ├── TestLiteLLMModel.test_run_prompt[without-router].yaml
    │           ├── TestMultipleCompletion.test_model[gpt-3.5-turbo-0125].yaml
    │           ├── TestMultipleCompletion.test_model[gpt-3.5-turbo].yaml
    │           ├── TestMultipleCompletion.test_model[gpt-4o-mini-2024-07-18].yaml
    │           ├── TestMultipleCompletion.test_model[gpt-4o-mini].yaml
    │           ├── TestMultipleCompletion.test_model[gpt-4o].yaml
    │           ├── TestMultipleCompletion.test_multiple_completion[openai].yaml
    │           ├── TestMultipleCompletion.test_output_schema[json-mode-base-model].yaml
    │           ├── TestMultipleCompletion.test_output_schema[json-mode-type-adapter].yaml
    │           ├── TestMultipleCompletion.test_output_schema[structured-outputs].yaml
    │           ├── TestMultipleCompletion.test_parameterizing_tool_from_arg_union.yaml
    │           ├── TestMultipleCompletion.test_single_completion[claude-3-5-haiku-20241022].yaml
    │           ├── TestMultipleCompletion.test_single_completion[claude-3-haiku-20240307].yaml
    │           ├── TestMultipleCompletion.test_single_completion[gpt-3.5-turbo-0125].yaml
    │           ├── TestMultipleCompletion.test_single_completion[gpt-3.5-turbo].yaml
    │           ├── TestMultipleCompletion.test_single_completion[gpt-4o-mini-2024-07-18].yaml
    │           ├── TestMultipleCompletion.test_text_image_message[gpt-4o-mini-2024-07-18].yaml
    │           ├── TestReasoning.test_deepseek_model[deepseek-reasoner].yaml
    │           ├── TestReasoning.test_deepseek_model[openrouter-deepseek].yaml
    │           ├── TestTooling.test_empty_tools[Anthropic-empty-tools].yaml
    │           ├── TestTooling.test_empty_tools[Anthropic-no-tools].yaml
    │           ├── TestTooling.test_empty_tools[OpenAI-empty-tools].yaml
    │           ├── TestTooling.test_empty_tools[OpenAI-no-tools].yaml
    │           └── TestTooling.test_tool_selection.yaml
    │       ├── conftest.py
    │       ├── test_cost_tracking.py
    │       ├── test_embeddings.py
    │       ├── test_llms.py
    │       └── test_rate_limiter.py
├── pyproject.toml
├── src
    └── ldp
    │   ├── __init__.py
    │   ├── agent
    │       ├── __init__.py
    │       ├── agent.py
    │       ├── agent_client.py
    │       ├── interactive_agent.py
    │       ├── memory_agent.py
    │       ├── react_agent.py
    │       ├── simple_agent.py
    │       └── tree_of_thoughts_agent.py
    │   ├── alg
    │       ├── __init__.py
    │       ├── algorithms.py
    │       ├── beam_search.py
    │       ├── callbacks.py
    │       ├── datasets.py
    │       ├── optimizer
    │       │   ├── __init__.py
    │       │   ├── ape.py
    │       │   ├── memory.py
    │       │   ├── opt.py
    │       │   └── replay_buffers.py
    │       ├── rollout.py
    │       ├── runners.py
    │       └── tree_search.py
    │   ├── data_structures.py
    │   ├── graph
    │       ├── __init__.py
    │       ├── async_torch.py
    │       ├── common_ops.py
    │       ├── gradient_estimators.py
    │       ├── loss_ops.py
    │       ├── memory.py
    │       ├── modules
    │       │   ├── __init__.py
    │       │   ├── llm_call.py
    │       │   ├── react.py
    │       │   ├── reflect.py
    │       │   └── thought.py
    │       ├── op_utils.py
    │       ├── ops.py
    │       └── torch_ops.py
    │   ├── llms
    │       ├── __init__.py
    │       └── prompts.py
    │   ├── main.py
    │   ├── nn
    │       ├── __init__.py
    │       ├── agent
    │       │   └── simple_local_agent.py
    │       ├── chat_templates
    │       │   ├── README.md
    │       │   ├── llama2_chat_template_ori.jinja
    │       │   ├── llama3.1_chat_template_hf.jinja
    │       │   ├── llama3.1_chat_template_nothought.jinja
    │       │   ├── llama3.1_chat_template_thought.jinja
    │       │   ├── llama3.1_chat_template_vllm.jinja
    │       │   └── llama3_chat_template_ori.jinja
    │       ├── generation
    │       │   ├── __init__.py
    │       │   └── base.py
    │       ├── graph
    │       │   └── llm_call_op.py
    │       ├── handlers
    │       │   ├── chunking.py
    │       │   ├── module_handler.py
    │       │   └── transformer_handler.py
    │       ├── lm_config.py
    │       └── utils.py
    │   ├── py.typed
    │   ├── shims.py
    │   └── utils.py
├── tests
    ├── .gitignore
    ├── __init__.py
    ├── cassettes
    │   ├── TestAgentState.test_no_state_mutation[agent0].yaml
    │   ├── TestAgentState.test_no_state_mutation[agent1].yaml
    │   ├── TestAgentState.test_no_state_mutation[agent2].yaml
    │   ├── TestHTTPAgentClient.test_lifecycle.yaml
    │   ├── TestLLMCallOp.test_compute_logprob[0.0].yaml
    │   ├── TestLLMCallOp.test_compute_logprob[0.5].yaml
    │   ├── TestLLMCallOp.test_compute_logprob[1.0].yaml
    │   ├── TestLLMCallOp.test_cost_tracking.yaml
    │   ├── TestLLMCallOp.test_empty_tools.yaml
    │   ├── TestLLMCallOp.test_validation.yaml
    │   ├── TestLLMModel.test_model[claude-3-haiku-20240307].yaml
    │   ├── TestLLMModel.test_model[gpt-3.5-turbo].yaml
    │   ├── TestLLMModel.test_output_schema[json-mode].yaml
    │   ├── TestLLMModel.test_output_schema[structured-outputs].yaml
    │   ├── TestLLMModel.test_output_type_rejected_validation.yaml
    │   ├── TestLLMModel.test_parameterizing_tool_from_arg_union.yaml
    │   ├── TestLLMModel.test_streaming[claude-3-haiku-20240307].yaml
    │   ├── TestLLMModel.test_streaming[gpt-3.5-turbo].yaml
    │   ├── TestLLMModel.test_text_image_message[claude-3-haiku-20240307].yaml
    │   ├── TestLLMModel.test_text_image_message[gpt-4-turbo].yaml
    │   ├── TestLLMModel.test_text_image_message[gpt-4o-mini-2024-07-18].yaml
    │   ├── TestLiteEmbeddingModel.test_caching.yaml
    │   ├── TestMemoryAgent.test_agent_grad.yaml
    │   ├── TestMemoryAgent.test_dummyenv[gpt-4o-mini-2024-07-18].yaml
    │   ├── TestMemoryOpt.test_lessons_memory_optimizer.yaml
    │   ├── TestMultipleCompletionLLMModel.test_model[gpt-3.5-turbo].yaml
    │   ├── TestMultipleCompletionLLMModel.test_output_schema[json-mode].yaml
    │   ├── TestMultipleCompletionLLMModel.test_output_schema[structured-outputs].yaml
    │   ├── TestMultipleCompletionLLMModel.test_parameterizing_tool_from_arg_union.yaml
    │   ├── TestMultipleCompletionLLMModel.test_text_image_message[gpt-4o-mini-2024-07-18].yaml
    │   ├── TestNoToolsSimpleAgent.test_dummyenv[claude-3-5-haiku-20241022].yaml
    │   ├── TestNoToolsSimpleAgent.test_dummyenv[claude-3-haiku-20240307].yaml
    │   ├── TestNoToolsSimpleAgent.test_dummyenv[gpt-4o-mini-2024-07-18].yaml
    │   ├── TestParallelism.test_SimpleAgent_can_parallel_call.yaml
    │   ├── TestReActAgent.test_agent_grad[False-claude-3-5-haiku-20241022].yaml
    │   ├── TestReActAgent.test_agent_grad[False-claude-3-haiku-20240307].yaml
    │   ├── TestReActAgent.test_agent_grad[False-gpt-4o].yaml
    │   ├── TestReActAgent.test_agent_grad[True-claude-3-5-haiku-20241022].yaml
    │   ├── TestReActAgent.test_agent_grad[True-claude-3-haiku-20240307].yaml
    │   ├── TestReActAgent.test_agent_grad[True-gpt-4-turbo].yaml
    │   ├── TestReActAgent.test_multi_step[False].yaml
    │   ├── TestReActAgent.test_multi_step[True].yaml
    │   ├── TestReActAgent.test_react_dummyenv[False-claude-3-5-haiku-20241022].yaml
    │   ├── TestReActAgent.test_react_dummyenv[False-claude-3-haiku-20240307].yaml
    │   ├── TestReActAgent.test_react_dummyenv[False-gpt-4o].yaml
    │   ├── TestReActAgent.test_react_dummyenv[True-claude-3-5-haiku-20241022].yaml
    │   ├── TestReActAgent.test_react_dummyenv[True-claude-3-haiku-20240307].yaml
    │   ├── TestReActAgent.test_react_dummyenv[True-gpt-4-turbo].yaml
    │   ├── TestSimpleAgent.test_agent_grad[claude-3-5-haiku-20241022].yaml
    │   ├── TestSimpleAgent.test_agent_grad[claude-3-haiku-20240307].yaml
    │   ├── TestSimpleAgent.test_agent_grad[gpt-4o-mini-2024-07-18].yaml
    │   ├── TestSimpleAgent.test_dummyenv[claude-3-5-haiku-20241022].yaml
    │   ├── TestSimpleAgent.test_dummyenv[claude-3-haiku-20240307].yaml
    │   ├── TestSimpleAgent.test_dummyenv[gpt-4o-mini-2024-07-18].yaml
    │   ├── TestSimpleAgent.test_hide_old_action_content.yaml
    │   ├── TestSimpleAgent.test_hide_old_env_states.yaml
    │   ├── test_beam_search.yaml
    │   ├── test_embedding_op[text-embedding-3-large-0-256].yaml
    │   ├── test_embedding_op[text-embedding-3-large-0-512].yaml
    │   ├── test_embedding_op[text-embedding-3-large-32-256].yaml
    │   ├── test_embedding_op[text-embedding-3-large-32-512].yaml
    │   ├── test_embedding_op[text-embedding-3-large-64-256].yaml
    │   ├── test_embedding_op[text-embedding-3-large-64-512].yaml
    │   ├── test_embedding_op[text-embedding-3-small-0-256].yaml
    │   ├── test_embedding_op[text-embedding-3-small-0-512].yaml
    │   ├── test_embedding_op[text-embedding-3-small-32-256].yaml
    │   ├── test_embedding_op[text-embedding-3-small-32-512].yaml
    │   ├── test_embedding_op[text-embedding-3-small-64-256].yaml
    │   ├── test_embedding_op[text-embedding-3-small-64-512].yaml
    │   ├── test_fallbacks_working[False].yaml
    │   ├── test_fallbacks_working[True].yaml
    │   ├── test_llm_call_graph.yaml
    │   ├── test_offline_trainer[False].yaml
    │   ├── test_offline_trainer[True].yaml
    │   ├── test_online_trainer[False].yaml
    │   ├── test_online_trainer[True].yaml
    │   ├── test_reflect_module.yaml
    │   ├── test_rollout[False].yaml
    │   └── test_rollout[True].yaml
    ├── conftest.py
    ├── test_agents.py
    ├── test_algorithms.py
    ├── test_buffers.py
    ├── test_context_managers.py
    ├── test_data_structures.py
    ├── test_envs.py
    ├── test_gradients.py
    ├── test_loss_ops.py
    ├── test_memory.py
    ├── test_modules.py
    ├── test_nn_models.py
    ├── test_nn_ops.py
    ├── test_ops.py
    ├── test_optimizer.py
    ├── test_prompts.py
    ├── test_rollouts.py
    ├── test_runners.py
    ├── test_shims.py
    ├── test_torch_ops.py
    └── test_utils.py
├── tutorials
    ├── creating_a_language_agent.ipynb
    └── evaluating_a_llama_agent.ipynb
└── uv.lock


/.github/renovate.json5:
--------------------------------------------------------------------------------
 1 | {
 2 |   $schema: "https://docs.renovatebot.com/renovate-schema.json",
 3 |   extends: ["config:recommended"],
 4 |   schedule: ["* 2 1-7 * 1"],
 5 |   prHourlyLimit: 4,
 6 |   timezone: "America/Los_Angeles",
 7 |   rangeStrategy: "widen",
 8 |   lockFileMaintenance: {
 9 |     enabled: true,
10 |     schedule: ["* 2 1-7 * 1"], // Work around https://github.com/renovatebot/renovate/discussions/33152
11 |   },
12 |   minimumReleaseAge: "2 weeks",
13 |   "pre-commit": {
14 |     enabled: true,
15 |   },
16 |   packageRules: [
17 |     {
18 |       matchUpdateTypes: ["lockFileMaintenance"],
19 |       automerge: true,
20 |     },
21 |     {
22 |       // group:allNonMajor, with automerge
23 |       groupName: "all non-major dependencies",
24 |       groupSlug: "all-minor-patch",
25 |       matchPackageNames: ["*"],
26 |       matchUpdateTypes: ["minor", "patch"],
27 |       automerge: true,
28 |     },
29 |     {
30 |       // TODO: remove after torch supports Python 3.13
31 |       matchPackageNames: ["python"],
32 |       allowedVersions: "<=3.12",
33 |     },
34 |   ],
35 | }
36 | 


--------------------------------------------------------------------------------
/.github/workflows/codeflash.yml:
--------------------------------------------------------------------------------
 1 | name: CodeFlash
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     paths:
 6 |       - "ldp/**"
 7 |       - "src/**"
 8 |       - "packages/**"
 9 |   workflow_dispatch:
10 | 
11 | concurrency: # Cancel prior if new push, SEE: https://stackoverflow.com/a/72408109
12 |   group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
13 |   cancel-in-progress: true
14 | 
15 | jobs:
16 |   optimize: # SEE: https://docs.codeflash.ai/getting-started/codeflash-github-actions
17 |     runs-on: ubuntu-latest
18 |     env:
19 |       CODEFLASH_API_KEY: ${{ secrets.CODEFLASH_API_KEY }}
20 |       CODEFLASH_PR_NUMBER: ${{ github.event.number }}
21 |     steps:
22 |       - name: Check if PR is from CodeFlash bot
23 |         id: bot_check
24 |         working-directory: .
25 |         run: |
26 |           echo "Checking if this PR is created by CodeFlash bot..."
27 |           if [ "${{ github.event.pull_request.user.login }}" == "codeflash-ai[bot]" ]; then
28 |             echo "PR created by Codeflash bot. Skipping optimization."
29 |             echo "skip_remaining_steps=yes" >> $GITHUB_OUTPUT
30 |           else
31 |             echo "skip_remaining_steps=no" >> $GITHUB_OUTPUT
32 |             echo "It's not. Proceeding with the optimization."
33 |           fi
34 |       - if: steps.bot_check.outputs.skip_remaining_steps == 'no'
35 |         uses: actions/checkout@v4
36 |         with:
37 |           fetch-depth: 0
38 |       - if: steps.bot_check.outputs.skip_remaining_steps == 'no'
39 |         uses: astral-sh/setup-uv@v5
40 |         with:
41 |           enable-cache: true
42 |       - if: steps.bot_check.outputs.skip_remaining_steps == 'no'
43 |         run: uv sync --group=codeflash
44 |       - if: steps.bot_check.outputs.skip_remaining_steps == 'no'
45 |         name: Run CodeFlash on ldp
46 |         run: uv run codeflash --module-root=src/ldp --tests-root=tests
47 |       - if: steps.bot_check.outputs.skip_remaining_steps == 'no'
48 |         name: Run CodeFlash on lmi
49 |         run: uv run codeflash --module-root=packages/lmi/src/lmi --tests-root=packages/lmi/tests
50 | 


--------------------------------------------------------------------------------
/.github/workflows/publish.yml:
--------------------------------------------------------------------------------
 1 | name: Publish
 2 | 
 3 | on:
 4 |   release:
 5 |     types: [created]
 6 |   workflow_dispatch:
 7 | 
 8 | jobs:
 9 |   publish:
10 |     runs-on: ubuntu-latest
11 |     steps:
12 |       - uses: actions/checkout@v4
13 |       - id: build-ldp
14 |         uses: hynek/build-and-inspect-python-package@v2
15 |         with:
16 |           upload-name-suffix: -ldp
17 |       - name: Download built artifact to dist/
18 |         uses: actions/download-artifact@v4
19 |         with:
20 |           name: ${{ steps.build-ldp.outputs.artifact-name }}
21 |           path: dist_ldp
22 |       - id: build-fhlmi
23 |         uses: hynek/build-and-inspect-python-package@v2
24 |         with:
25 |           path: packages/lmi
26 |           upload-name-suffix: -fhlmi
27 |       - name: Download built artifact to dist/
28 |         uses: actions/download-artifact@v4
29 |         with:
30 |           name: ${{ steps.build-fhlmi.outputs.artifact-name }}
31 |           path: dist_fhlmi
32 |       - uses: pypa/gh-action-pypi-publish@release/v1
33 |         with:
34 |           password: ${{ secrets.PYPI_API_LDP_TOKEN }}
35 |           packages-dir: dist_ldp
36 |       - uses: pypa/gh-action-pypi-publish@release/v1
37 |         with:
38 |           password: ${{ secrets.PYPI_API_LMI_TOKEN }}
39 |           packages-dir: dist_fhlmi
40 | 


--------------------------------------------------------------------------------
/.github/workflows/tests.yml:
--------------------------------------------------------------------------------
 1 | name: Lint and Test
 2 | 
 3 | on:
 4 |   push:
 5 |     branches:
 6 |       - main
 7 |       - renovate/*
 8 |   pull_request:
 9 |   workflow_dispatch:
10 | 
11 | jobs:
12 |   pre-commit:
13 |     runs-on: ubuntu-latest
14 |     if: github.event_name == 'pull_request' # pre-commit-ci/lite-action only runs here
15 |     strategy:
16 |       matrix:
17 |         python-version: [3.11, 3.13] # Our min and max supported Python versions
18 |     steps:
19 |       - uses: actions/checkout@v4
20 |         with:
21 |           fetch-depth: 0 # For setuptools-scm, replace with fetch-tags after https://github.com/actions/checkout/issues/1471
22 |       - uses: actions/setup-python@v5
23 |         with:
24 |           python-version: ${{ matrix.python-version }}
25 |       - uses: astral-sh/setup-uv@v5
26 |         with:
27 |           enable-cache: true
28 |       - run: echo "UV_PROJECT_ENVIRONMENT=$(python -c "import sysconfig; print(sysconfig.get_config_var('prefix'))")" >> $GITHUB_ENV
29 |       - run: uv python pin ${{ matrix.python-version }} # uv requires .python-version to match OS Python: https://github.com/astral-sh/uv/issues/11389
30 |       - run: uv sync --python-preference only-system
31 |       - run: git checkout .python-version # For clean git diff given `pre-commit run --show-diff-on-failure`
32 |       - uses: pre-commit/action@v3.0.1
33 |       - uses: pre-commit-ci/lite-action@v1.1.0
34 |         if: always()
35 |   lint:
36 |     runs-on: ubuntu-latest
37 |     strategy:
38 |       matrix:
39 |         python-version: [3.11, 3.13] # Our min and max supported Python versions
40 |     steps:
41 |       - uses: actions/checkout@v4
42 |       - uses: astral-sh/setup-uv@v5
43 |         with:
44 |           enable-cache: true
45 |       - run: uv python pin ${{ matrix.python-version }}
46 |       - run: uv sync --python-preference=only-managed
47 |       - run: uv run refurb .
48 |       - if: matrix.python-version == '3.11' # Only need to run this on one version
49 |         uses: suzuki-shunsuke/github-action-renovate-config-validator@v1.1.1
50 |   test-ldp:
51 |     runs-on: ubuntu-latest
52 |     steps:
53 |       - uses: actions/checkout@v4
54 |       - uses: astral-sh/setup-uv@v5
55 |         with:
56 |           enable-cache: true
57 |       - run: uv sync
58 |       - run: uv run pytest -n 16 --dist=loadfile tests
59 |         env:
60 |           OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
61 |           ANTHROPIC_API_KEY: ${{ secrets.ANTHROPIC_API_KEY }}
62 |   test-lmi:
63 |     runs-on: ubuntu-latest
64 |     steps:
65 |       - uses: actions/checkout@v4
66 |       - uses: astral-sh/setup-uv@v5
67 |         with:
68 |           enable-cache: true
69 |       - run: uv sync
70 |       - run: |
71 |           uv run pytest -n 16 --dist=loadfile packages/lmi/tests
72 |         env:
73 |           OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
74 |           ANTHROPIC_API_KEY: ${{ secrets.ANTHROPIC_API_KEY }}
75 | 


--------------------------------------------------------------------------------
/.mailmap:
--------------------------------------------------------------------------------
1 | Andrew White <andrew@futurehouse.org> <white.d.andrew@gmail.com>
2 | James Braza <james@futurehouse.org> <jamesbraza@gmail.com>
3 | Mayk Caldas <mayk@futurehouse.org> maykcaldas
4 | Michael Skarlinski <mskarlinski@futurehouse.org> mskarlin <12701035+mskarlin@users.noreply.github.com>
5 | Ryan-Rhys Griffiths <ryan@futurehouse.org> <ryangriff123@gmail.com>
6 | Siddharth Narayanan <sid@futurehouse.org> <sidnarayanan@users.noreply.github.com>
7 | 


--------------------------------------------------------------------------------
/.pre-commit-config.yaml:
--------------------------------------------------------------------------------
 1 | ---
 2 | default_language_version:
 3 |   python: python3
 4 | repos:
 5 |   - repo: https://github.com/pre-commit/pre-commit-hooks
 6 |     rev: v5.0.0
 7 |     hooks:
 8 |       - id: check-added-large-files
 9 |       - id: check-byte-order-marker
10 |       - id: check-case-conflict
11 |       - id: check-merge-conflict
12 |       - id: check-shebang-scripts-are-executable
13 |       - id: check-symlinks
14 |       - id: check-toml
15 |       - id: check-yaml
16 |       - id: debug-statements
17 |       - id: detect-private-key
18 |       - id: end-of-file-fixer
19 |       - id: mixed-line-ending
20 |       - id: trailing-whitespace
21 |   - repo: https://github.com/jsh9/markdown-toc-creator
22 |     rev: 0.0.10
23 |     hooks:
24 |       - id: markdown-toc-creator
25 |   - repo: https://github.com/astral-sh/ruff-pre-commit
26 |     rev: v0.9.9
27 |     hooks:
28 |       - id: ruff
29 |         args: [--fix, --exit-non-zero-on-fix]
30 |       - id: ruff-format
31 |   - repo: https://github.com/rbubley/mirrors-prettier
32 |     rev: v3.5.3
33 |     hooks:
34 |       - id: prettier
35 |   - repo: https://github.com/Yelp/detect-secrets
36 |     rev: v1.5.0
37 |     hooks:
38 |       - id: detect-secrets
39 |         additional_dependencies: [".[word_list]"]
40 |         args:
41 |           - --word-list=.secrets.allowlist
42 |           - --exclude-files=.secrets.baseline$
43 |         exclude: tests/cassettes
44 |   - repo: https://github.com/adamchainz/blacken-docs
45 |     rev: 1.19.1
46 |     hooks:
47 |       - id: blacken-docs
48 |   - repo: https://github.com/jsh9/markdown-toc-creator
49 |     rev: 0.0.10
50 |     hooks:
51 |       - id: markdown-toc-creator
52 |   - repo: https://github.com/jumanjihouse/pre-commit-hooks
53 |     rev: 3.0.0
54 |     hooks:
55 |       - id: check-mailmap
56 |   - repo: https://github.com/codespell-project/codespell
57 |     rev: v2.4.1
58 |     hooks:
59 |       - id: codespell
60 |         additional_dependencies: [".[toml]"]
61 |         exclude_types: [jupyter]
62 |   - repo: https://github.com/pappasam/toml-sort
63 |     rev: v0.24.2
64 |     hooks:
65 |       - id: toml-sort-fix
66 |   - repo: https://github.com/srstevenson/nb-clean
67 |     rev: 4.0.1
68 |     hooks:
69 |       - id: nb-clean
70 |         args: [--preserve-cell-outputs, --remove-empty-cells]
71 |   - repo: https://github.com/henryiii/validate-pyproject-schema-store
72 |     rev: 2025.02.24
73 |     hooks:
74 |       - id: validate-pyproject
75 |   - repo: https://github.com/astral-sh/uv-pre-commit
76 |     rev: 0.6.3
77 |     hooks:
78 |       - id: uv-lock
79 |   - repo: local
80 |     hooks:
81 |       - id: mypy
82 |         name: mypy
83 |         entry: mypy
84 |         language: system
85 |         types_or: [python, pyi]
86 | 


--------------------------------------------------------------------------------
/.python-version:
--------------------------------------------------------------------------------
1 | 3.13
2 | 


--------------------------------------------------------------------------------
/.secrets.allowlist:
--------------------------------------------------------------------------------
1 | authorization
2 | x-api-key
3 | abc123
4 | 


--------------------------------------------------------------------------------
/CITATION.cff:
--------------------------------------------------------------------------------
 1 | ---
 2 | cff-version: 1.2.0
 3 | title: "Aviary: training language agents on challenging scientific tasks"
 4 | message: >-
 5 |   If you use this software, please cite it using the
 6 |   metadata from this file.
 7 | authors:
 8 |   - given-names: Siddharth
 9 |     family-names: Narayanan
10 |   - given-names: James D.
11 |     family-names: Braza
12 |   - given-names: Ryan-Rhys
13 |     family-names: Griffiths
14 |   - family-names: Ponnapati
15 |     given-names: Manvitha
16 |   - given-names: Albert
17 |     family-names: Bou
18 |   - given-names: Jon
19 |     family-names: Laurent
20 |   - given-names: Ori
21 |     family-names: Kabeli
22 |   - given-names: Geemi
23 |     family-names: Wellawatte
24 |   - given-names: Sam
25 |     family-names: Cox
26 |   - given-names: Samuel G.
27 |     family-names: Rodriques
28 |   - given-names: Andrew D.
29 |     family-names: White
30 | identifiers:
31 |   - type: doi
32 |     value: 10.48550/arXiv.2412.21154
33 |     description: ArXiv DOI
34 |   - type: url
35 |     value: https://arxiv.org/abs/2412.21154
36 |     description: ArXiv abstract
37 | repository-code: https://github.com/Future-House/ldp
38 | keywords:
39 |   - Artificial Intelligence
40 |   - Computation and Language
41 |   - Machine Learning
42 | license: Apache-2.0
43 | preferred-citation:
44 |   authors:
45 |     - given-names: Siddharth
46 |       family-names: Narayanan
47 |     - given-names: James D.
48 |       family-names: Braza
49 |     - given-names: Ryan-Rhys
50 |       family-names: Griffiths
51 |     - family-names: Ponnapati
52 |       given-names: Manvitha
53 |     - given-names: Albert
54 |       family-names: Bou
55 |     - given-names: Jon
56 |       family-names: Laurent
57 |     - given-names: Ori
58 |       family-names: Kabeli
59 |     - given-names: Geemi
60 |       family-names: Wellawatte
61 |     - given-names: Sam
62 |       family-names: Cox
63 |     - given-names: Samuel G.
64 |       family-names: Rodriques
65 |     - given-names: Andrew D.
66 |       family-names: White
67 |   date-published: 2024-12-30
68 |   doi: 10.48550/arXiv.2412.21154
69 |   journal: preprint
70 |   title: "Aviary: training language agents on challenging scientific tasks"
71 |   type: article
72 |   url: https://arxiv.org/abs/2412.21154
73 | 


--------------------------------------------------------------------------------
/citation.bib:
--------------------------------------------------------------------------------
1 | @article{narayanan2024aviary,
2 |   title={Aviary: training language agents on challenging scientific tasks},
3 |   author={Narayanan, Siddharth and Braza, James D and Griffiths, Ryan-Rhys and Ponnapati, Manu and Bou, Albert and Laurent, Jon and Kabeli, Ori and Wellawatte, Geemi and Cox, Sam and Rodriques, Samuel G and others},
4 |   journal={arXiv preprint arXiv:2412.21154},
5 |   year={2024}
6 | }
7 | 


--------------------------------------------------------------------------------
/docs/assets/Aviary.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Future-House/ldp/2e9557233dc0e4c8abbb9f1f065059108a0dcfcd/docs/assets/Aviary.png


--------------------------------------------------------------------------------
/docs/assets/ldp_chessboard.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Future-House/ldp/2e9557233dc0e4c8abbb9f1f065059108a0dcfcd/docs/assets/ldp_chessboard.png


--------------------------------------------------------------------------------
/docs/assets/ldp_definition.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Future-House/ldp/2e9557233dc0e4c8abbb9f1f065059108a0dcfcd/docs/assets/ldp_definition.png


--------------------------------------------------------------------------------
/packages/lmi/pyproject.toml:
--------------------------------------------------------------------------------
 1 | [build-system]
 2 | build-backend = "setuptools.build_meta"
 3 | requires = ["setuptools>=64", "setuptools_scm>=8"]
 4 | 
 5 | [dependency-groups]
 6 | codeflash = [
 7 |     "codeflash>=0.8",  # Pin for --verify-setup checking formatter-cmds
 8 |     "fhlmi[dev]",
 9 | ]
10 | dev = ["fhlmi[dev]"]
11 | 
12 | [project]
13 | authors = [
14 |     {email = "hello@futurehouse.org", name = "FutureHouse technical staff"},
15 | ]
16 | # Full list: https://pypi.python.org/pypi?%3Aaction=list_classifiers
17 | classifiers = [
18 |     "Operating System :: OS Independent",
19 |     "Programming Language :: Python :: 3 :: Only",
20 |     "Programming Language :: Python :: 3.11",
21 |     "Programming Language :: Python :: 3.12",
22 |     "Programming Language :: Python :: 3.13",
23 |     "Programming Language :: Python",
24 | ]
25 | dependencies = [
26 |     "coredis",
27 |     "fhaviary>=0.14.0",  # For multi-image support
28 |     "limits>=4.8",  # Pin for RedisBridge.key_prefix
29 |     "litellm>=1.63.5",  # Pin lower for reasoning + streaming fix
30 |     "pydantic~=2.0,>=2.10.1",
31 |     "tiktoken>=0.4.0",
32 |     "typing-extensions; python_version <= '3.11'",  # for typing.override
33 | ]
34 | description = "A client to provide LLM responses for FutureHouse applications."
35 | dynamic = ["version"]
36 | license = {file = "LICENSE"}
37 | name = "fhlmi"
38 | readme = "README.md"
39 | requires-python = ">=3.11"
40 | 
41 | [project.optional-dependencies]
42 | dev = [
43 |     "fhaviary[xml]",
44 |     "fhlmi[local,progress,typing,vcr]",
45 |     "ipython>=8",  # Pin to keep recent
46 |     "litellm>=1.68",  # Pin for PydanticDeprecatedSince20 fixes
47 |     "mypy>=1.8",  # Pin for mutable-override
48 |     "pre-commit>=3.4",  # Pin to keep recent
49 |     "pylint-pydantic",
50 |     "pytest-asyncio",
51 |     "pytest-recording",
52 |     "pytest-rerunfailures",
53 |     "pytest-subtests",
54 |     "pytest-sugar",
55 |     "pytest-timer[colorama]",
56 |     "pytest-xdist",
57 |     "pytest>=8",  # Pin to keep recent
58 |     "python-dotenv",
59 |     "refurb>=2",  # Pin to keep recent
60 |     "typeguard",
61 | ]
62 | local = [
63 |     "numpy",
64 |     "sentence-transformers",
65 | ]
66 | progress = ["tqdm"]
67 | typing = ["types-tqdm"]
68 | vcr = [
69 |     "vcrpy>=6",  # Pin for https://github.com/kevin1024/vcrpy/issues/884
70 | ]
71 | 
72 | [project.urls]
73 | issues = "https://github.com/Future-House/ldp/packages/lmi/issues"
74 | repository = "https://github.com/Future-House/ldp/packages/lmi"
75 | 
76 | [tool.ruff]
77 | extend = "../../pyproject.toml"
78 | 
79 | [tool.setuptools.packages.find]
80 | where = ["src"]
81 | 
82 | [tool.setuptools_scm]
83 | root = "../.."
84 | version_file = "src/lmi/version.py"
85 | 


--------------------------------------------------------------------------------
/packages/lmi/src/lmi/__init__.py:
--------------------------------------------------------------------------------
 1 | from .constants import (
 2 |     CHARACTERS_PER_TOKEN_ASSUMPTION,
 3 |     EXTRA_TOKENS_FROM_USER_ROLE,
 4 |     MODEL_COST_MAP,
 5 | )
 6 | from .cost_tracker import GLOBAL_COST_TRACKER, cost_tracking_ctx, enable_cost_tracking
 7 | from .embeddings import (
 8 |     EmbeddingModel,
 9 |     EmbeddingModes,
10 |     HybridEmbeddingModel,
11 |     LiteLLMEmbeddingModel,
12 |     SentenceTransformerEmbeddingModel,
13 |     SparseEmbeddingModel,
14 |     embedding_model_factory,
15 | )
16 | from .exceptions import (
17 |     JSONSchemaValidationError,
18 | )
19 | from .llms import (
20 |     CommonLLMNames,
21 |     LiteLLMModel,
22 |     LLMModel,
23 |     sum_logprobs,
24 |     validate_json_completion,
25 | )
26 | from .types import (
27 |     Embeddable,
28 |     LLMResult,
29 | )
30 | from .utils import (
31 |     configure_llm_logs,
32 | )
33 | 
34 | __all__ = [
35 |     "CHARACTERS_PER_TOKEN_ASSUMPTION",
36 |     "EXTRA_TOKENS_FROM_USER_ROLE",
37 |     "GLOBAL_COST_TRACKER",
38 |     "MODEL_COST_MAP",
39 |     "CommonLLMNames",
40 |     "Embeddable",
41 |     "EmbeddingModel",
42 |     "EmbeddingModes",
43 |     "HybridEmbeddingModel",
44 |     "JSONSchemaValidationError",
45 |     "LLMModel",
46 |     "LLMResult",
47 |     "LiteLLMEmbeddingModel",
48 |     "LiteLLMModel",
49 |     "SentenceTransformerEmbeddingModel",
50 |     "SparseEmbeddingModel",
51 |     "configure_llm_logs",
52 |     "cost_tracking_ctx",
53 |     "embedding_model_factory",
54 |     "enable_cost_tracking",
55 |     "sum_logprobs",
56 |     "validate_json_completion",
57 | ]
58 | 


--------------------------------------------------------------------------------
/packages/lmi/src/lmi/constants.py:
--------------------------------------------------------------------------------
 1 | from sys import version_info
 2 | 
 3 | import litellm
 4 | 
 5 | # Estimate from OpenAI's FAQ
 6 | # https://help.openai.com/en/articles/4936856-what-are-tokens-and-how-to-count-them
 7 | CHARACTERS_PER_TOKEN_ASSUMPTION: float = 4.0
 8 | # Added tokens from user/role message
 9 | # Need to add while doing rate limits
10 | # Taken from empirical counts in tests
11 | EXTRA_TOKENS_FROM_USER_ROLE: int = 7
12 | 
13 | MODEL_COST_MAP = litellm.get_model_cost_map("")
14 | 
15 | DEFAULT_VERTEX_SAFETY_SETTINGS: list[dict[str, str]] = [
16 |     {
17 |         "category": "HARM_CATEGORY_HARASSMENT",
18 |         "threshold": "BLOCK_ONLY_HIGH",
19 |     },
20 |     {
21 |         "category": "HARM_CATEGORY_HATE_SPEECH",
22 |         "threshold": "BLOCK_ONLY_HIGH",
23 |     },
24 |     {
25 |         "category": "HARM_CATEGORY_SEXUALLY_EXPLICIT",
26 |         "threshold": "BLOCK_ONLY_HIGH",
27 |     },
28 |     {
29 |         "category": "HARM_CATEGORY_DANGEROUS_CONTENT",
30 |         "threshold": "BLOCK_ONLY_HIGH",
31 |     },
32 | ]
33 | 
34 | IS_PYTHON_BELOW_312 = version_info < (3, 12)
35 | 


--------------------------------------------------------------------------------
/packages/lmi/src/lmi/exceptions.py:
--------------------------------------------------------------------------------
1 | class JSONSchemaValidationError(ValueError):
2 |     """Raised when the completion does not match the specified schema."""
3 | 


--------------------------------------------------------------------------------
/packages/lmi/src/lmi/py.typed:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Future-House/ldp/2e9557233dc0e4c8abbb9f1f065059108a0dcfcd/packages/lmi/src/lmi/py.typed


--------------------------------------------------------------------------------
/packages/lmi/src/lmi/types.py:
--------------------------------------------------------------------------------
  1 | import contextvars
  2 | import logging
  3 | from contextlib import contextmanager
  4 | from datetime import datetime
  5 | from uuid import UUID, uuid4
  6 | 
  7 | import litellm
  8 | from aviary.core import Message
  9 | from pydantic import (
 10 |     BaseModel,
 11 |     ConfigDict,
 12 |     Field,
 13 |     computed_field,
 14 | )
 15 | 
 16 | logger = logging.getLogger(__name__)
 17 | 
 18 | # A context var that will be unique to threads/processes
 19 | cvar_session_id = contextvars.ContextVar[UUID | None]("session_id", default=None)
 20 | 
 21 | 
 22 | @contextmanager
 23 | def set_llm_session_ids(session_id: UUID):
 24 |     token = cvar_session_id.set(session_id)
 25 |     try:
 26 |         yield
 27 |     finally:
 28 |         cvar_session_id.reset(token)
 29 | 
 30 | 
 31 | class Embeddable(BaseModel):
 32 |     embedding: list[float] | None = Field(default=None, repr=False)
 33 | 
 34 | 
 35 | class LLMResult(BaseModel):
 36 |     """A class to hold the result of a LLM completion.
 37 | 
 38 |     To associate a group of LLMResults, you can use the `set_llm_session_ids` context manager:
 39 | 
 40 |     ```python
 41 |     my_session_id = uuid4()
 42 |     with set_llm_session_ids(my_session_id):
 43 |         # code that generates LLMResults
 44 |         pass
 45 |     ```
 46 | 
 47 |     and all the LLMResults generated within the context will have the same `session_id`.
 48 |     This can be combined with LLMModels `llm_result_callback` to store all LLMResults.
 49 |     """
 50 | 
 51 |     model_config = ConfigDict(populate_by_name=True)
 52 | 
 53 |     id: UUID = Field(default_factory=uuid4)
 54 |     session_id: UUID | None = Field(
 55 |         default_factory=cvar_session_id.get,  # type: ignore[arg-type]
 56 |         description="A persistent ID to associate a group of LLMResults",
 57 |         alias="answer_id",
 58 |     )
 59 |     name: str | None = None
 60 |     config: dict | None = None
 61 |     prompt: str | list[dict] | Message | list[Message] | None = Field(
 62 |         default=None,
 63 |         description="Optional prompt or list of serialized prompts.",
 64 |     )
 65 |     text: str | None = None
 66 |     messages: list[Message] | None = Field(
 67 |         default=None, description="Messages received from the LLM."
 68 |     )
 69 |     prompt_count: int = 0
 70 |     completion_count: int = 0
 71 |     model: str
 72 |     date: str = Field(default_factory=datetime.now().isoformat)
 73 |     seconds_to_first_token: float = Field(
 74 |         default=0.0, description="Delta time (sec) to first response token's arrival."
 75 |     )
 76 |     seconds_to_last_token: float = Field(
 77 |         default=0.0, description="Delta time (sec) to last response token's arrival."
 78 |     )
 79 |     logprob: float | None = Field(
 80 |         default=None, description="Sum of logprobs in the completion."
 81 |     )
 82 |     reasoning_content: str | None = Field(
 83 |         default=None, description="Reasoning content from LLMs such as DeepSeek-R1."
 84 |     )
 85 | 
 86 |     def __str__(self) -> str:
 87 |         return self.text or ""
 88 | 
 89 |     @computed_field  # type: ignore[prop-decorator]
 90 |     @property
 91 |     def cost(self) -> float:
 92 |         """Return the cost of the result in dollars."""
 93 |         if self.prompt_count and self.completion_count:
 94 |             try:
 95 |                 pc = litellm.model_cost[self.model]["input_cost_per_token"]
 96 |                 oc = litellm.model_cost[self.model]["output_cost_per_token"]
 97 |                 return pc * self.prompt_count + oc * self.completion_count
 98 |             except KeyError:
 99 |                 logger.warning(f"Could not find cost for model {self.model}.")
100 |         return 0.0
101 | 
102 |     # TODO: These two methods were implemented in ldp, but not in pqa.
103 |     # TODO: Check if they're necessary
104 |     @property
105 |     def provider(self) -> str:
106 |         """Get the model provider's name (e.g. "openai", "mistral")."""
107 |         return litellm.get_llm_provider(self.model)[1]
108 | 
109 |     def get_supported_openai_params(self) -> list[str] | None:
110 |         """Get the supported OpenAI parameters for the model."""
111 |         return litellm.get_supported_openai_params(self.model)
112 | 


--------------------------------------------------------------------------------
/packages/lmi/tests/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Future-House/ldp/2e9557233dc0e4c8abbb9f1f065059108a0dcfcd/packages/lmi/tests/__init__.py


--------------------------------------------------------------------------------
/packages/lmi/tests/cassettes/TestLiteLLMModel.test_cost_call[Anthropic-model].yaml:
--------------------------------------------------------------------------------
 1 | interactions:
 2 |   - request:
 3 |       body:
 4 |         '{"model": "claude-3-5-haiku-20241022", "messages": [{"role": "user", "content":
 5 |         [{"type": "text", "text": "What is the meaning of the universe?"}]}], "temperature":
 6 |         0, "max_tokens": 56, "system": [{"type": "text", "text": "Respond with single
 7 |         words."}]}'
 8 |       headers:
 9 |         accept:
10 |           - application/json
11 |         accept-encoding:
12 |           - gzip, deflate
13 |         anthropic-version:
14 |           - "2023-06-01"
15 |         connection:
16 |           - keep-alive
17 |         content-length:
18 |           - "253"
19 |         content-type:
20 |           - application/json
21 |         host:
22 |           - api.anthropic.com
23 |         user-agent:
24 |           - litellm/1.59.5
25 |       method: POST
26 |       uri: https://api.anthropic.com/v1/messages
27 |     response:
28 |       body:
29 |         string: !!binary |
30 |           H4sIAAAAAAAAA2SOMWvDMBSE/8vNcrDVplCNXbpkrOkQilDkRyLbeXKkJ9Ji/N+LQwMtnQ7uuztu
31 |           RuhgcM5HWzdtv7vu0uHSvz21L8+U3g/9KzdQkK+J1hTl7I4EhRTH1XA5hyyOBQrn2NEIAz+60lH1
32 |           UG2rkwtDqXStH5taayj4yEIsMPv5vin0ubZvYtDywPHKGywfClniZBO5HBkGxJ2Vkhg/INOlEHuC
33 |           4TKOCuV2zcwIPBWxEgfiDKMbBe/8iaxP5CREtn8D9Z0nct1/Fov8drbL8g0AAP//AwD1M9oFMwEA
34 |           AA==
35 |       headers:
36 |         CF-RAY:
37 |           - 909370809f0f15e3-SJC
38 |         Connection:
39 |           - keep-alive
40 |         Content-Encoding:
41 |           - gzip
42 |         Content-Type:
43 |           - application/json
44 |         Date:
45 |           - Tue, 28 Jan 2025 19:37:51 GMT
46 |         Server:
47 |           - cloudflare
48 |         Transfer-Encoding:
49 |           - chunked
50 |         X-Robots-Tag:
51 |           - none
52 |         anthropic-ratelimit-input-tokens-limit:
53 |           - "5000000"
54 |         anthropic-ratelimit-input-tokens-remaining:
55 |           - "5000000"
56 |         anthropic-ratelimit-input-tokens-reset:
57 |           - "2025-01-28T19:37:51Z"
58 |         anthropic-ratelimit-output-tokens-limit:
59 |           - "1000000"
60 |         anthropic-ratelimit-output-tokens-remaining:
61 |           - "1000000"
62 |         anthropic-ratelimit-output-tokens-reset:
63 |           - "2025-01-28T19:37:51Z"
64 |         anthropic-ratelimit-requests-limit:
65 |           - "5000"
66 |         anthropic-ratelimit-requests-remaining:
67 |           - "4999"
68 |         anthropic-ratelimit-requests-reset:
69 |           - "2025-01-28T19:37:51Z"
70 |         anthropic-ratelimit-tokens-limit:
71 |           - "6000000"
72 |         anthropic-ratelimit-tokens-remaining:
73 |           - "6000000"
74 |         anthropic-ratelimit-tokens-reset:
75 |           - "2025-01-28T19:37:51Z"
76 |         cf-cache-status:
77 |           - DYNAMIC
78 |         request-id:
79 |           - req_01Eppf1xbA8q5A3TkRYsr68g
80 |         via:
81 |           - 1.1 google
82 |       status:
83 |         code: 200
84 |         message: OK
85 | version: 1
86 | 


--------------------------------------------------------------------------------
/packages/lmi/tests/cassettes/TestLiteLLMModel.test_cost_call[OpenAI-model].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "system", "content": "Respond with single words."},
  5 |         {"role": "user", "content": "What is the meaning of the universe?"}], "model":
  6 |         "gpt-4o-mini-2024-07-18", "max_tokens": 56, "temperature": 0}'
  7 |       headers:
  8 |         accept:
  9 |           - application/json
 10 |         accept-encoding:
 11 |           - gzip, deflate
 12 |         connection:
 13 |           - keep-alive
 14 |         content-length:
 15 |           - "215"
 16 |         content-type:
 17 |           - application/json
 18 |         host:
 19 |           - api.openai.com
 20 |         user-agent:
 21 |           - AsyncOpenAI/Python 1.60.0
 22 |         x-stainless-arch:
 23 |           - arm64
 24 |         x-stainless-async:
 25 |           - async:asyncio
 26 |         x-stainless-lang:
 27 |           - python
 28 |         x-stainless-os:
 29 |           - MacOS
 30 |         x-stainless-package-version:
 31 |           - 1.60.0
 32 |         x-stainless-raw-response:
 33 |           - "true"
 34 |         x-stainless-retry-count:
 35 |           - "0"
 36 |         x-stainless-runtime:
 37 |           - CPython
 38 |         x-stainless-runtime-version:
 39 |           - 3.11.10
 40 |       method: POST
 41 |       uri: https://api.openai.com/v1/chat/completions
 42 |     response:
 43 |       body:
 44 |         string: !!binary |
 45 |           H4sIAAAAAAAAAwAAAP//jJJBT+MwEIXv+RXWnBuUlqKU3jhwQHBgkRAHhCLXniSmjseyJ7usUP87
 46 |           clKaIFhpLznMN+/lzXjeMyHAaNgKUK1k1XmbX/W23fx6etjvLx4e63b55zEEurm7vLnt6B4WSUG7
 47 |           V1T8qTpT1HmLbMiNWAWUjMl1WZ5visvzoiwG0JFGm2SN53xNeWecyVfFap0XZb7cHNUtGYURtuI5
 48 |           E0KI9+GbcjqNb7AVg9dQ6TBG2SBsT01CQCCbKiBjNJGlY1hMUJFjdEP06zcTGZ3Cs3lDwLqPMoV0
 49 |           vbXH+uH0R0uND7SLR36q18aZ2FYBZSSX3COTh4EeMiFehsn6L2HBB+o8V0x7dMlwtR7tYNrnBD8Z
 50 |           E0s702wWP5hVGlkaG2eLASVVi3pSTluUvTY0A9ls5O9ZfvIexzau+R/7CSiFnlFXPqA26uu8U1vA
 51 |           dGz/ajuteAgMEcNvo7BigyE9g8Za9nY8AYh/I2NX1cY1GHww4x3UvipXqEu5u1gryA7ZBwAAAP//
 52 |           AwC1HS6hFQMAAA==
 53 |       headers:
 54 |         CF-Cache-Status:
 55 |           - DYNAMIC
 56 |         CF-RAY:
 57 |           - 9093707c3c60174a-SJC
 58 |         Connection:
 59 |           - keep-alive
 60 |         Content-Encoding:
 61 |           - gzip
 62 |         Content-Type:
 63 |           - application/json
 64 |         Date:
 65 |           - Tue, 28 Jan 2025 19:37:51 GMT
 66 |         Server:
 67 |           - cloudflare
 68 |         Set-Cookie:
 69 |           - __cf_bm=dqIilPhCKBMWrfzBIKv4Z773uZfIHyMVkz9CwPgIUtA-1738093071-1.0.1.1-eLZ4cnMA8fb5u55VPgPzLBwaJH8MbcL3FaS_WIZ7m1Y2PPk00cpUZHpTcwEErfVXeYRqTRcDOGjb4niE.byJ3A;
 70 |             path=/; expires=Tue, 28-Jan-25 20:07:51 GMT; domain=.api.openai.com; HttpOnly;
 71 |             Secure; SameSite=None
 72 |           - _cfuvid=VubHV4jc3NAG1.KYK.9ezrasy_FR9RQDSt8gSdEubnM-1738093071389-0.0.1.1-604800000;
 73 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 74 |         Transfer-Encoding:
 75 |           - chunked
 76 |         X-Content-Type-Options:
 77 |           - nosniff
 78 |         access-control-expose-headers:
 79 |           - X-Request-ID
 80 |         alt-svc:
 81 |           - h3=":443"; ma=86400
 82 |         openai-organization:
 83 |           - future-house-xr4tdh
 84 |         openai-processing-ms:
 85 |           - "490"
 86 |         openai-version:
 87 |           - "2020-10-01"
 88 |         strict-transport-security:
 89 |           - max-age=31536000; includeSubDomains; preload
 90 |         x-ratelimit-limit-requests:
 91 |           - "30000"
 92 |         x-ratelimit-limit-tokens:
 93 |           - "150000000"
 94 |         x-ratelimit-remaining-requests:
 95 |           - "29999"
 96 |         x-ratelimit-remaining-tokens:
 97 |           - "149999926"
 98 |         x-ratelimit-reset-requests:
 99 |           - 2ms
100 |         x-ratelimit-reset-tokens:
101 |           - 0s
102 |         x-request-id:
103 |           - req_e0ce487241223e824cc737d821b5495c
104 |       status:
105 |         code: 200
106 |         message: OK
107 | version: 1
108 | 


--------------------------------------------------------------------------------
/packages/lmi/tests/cassettes/TestLiteLLMModel.test_max_token_truncation[with-router].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "user", "content": "Please tell me a story"}], "model":
  5 |         "gpt-4o-mini", "max_tokens": 3}'
  6 |       headers:
  7 |         accept:
  8 |           - application/json
  9 |         accept-encoding:
 10 |           - gzip, deflate
 11 |         connection:
 12 |           - keep-alive
 13 |         content-length:
 14 |           - "110"
 15 |         content-type:
 16 |           - application/json
 17 |         host:
 18 |           - api.openai.com
 19 |         user-agent:
 20 |           - AsyncOpenAI/Python 1.46.1
 21 |         x-stainless-arch:
 22 |           - arm64
 23 |         x-stainless-async:
 24 |           - async:asyncio
 25 |         x-stainless-lang:
 26 |           - python
 27 |         x-stainless-os:
 28 |           - MacOS
 29 |         x-stainless-package-version:
 30 |           - 1.46.1
 31 |         x-stainless-raw-response:
 32 |           - "true"
 33 |         x-stainless-runtime:
 34 |           - CPython
 35 |         x-stainless-runtime-version:
 36 |           - 3.12.7
 37 |       method: POST
 38 |       uri: https://api.openai.com/v1/chat/completions
 39 |     response:
 40 |       body:
 41 |         string: !!binary |
 42 |           H4sIAAAAAAAAA4ySUUvDMBSF3/srQp5b6bp13fomE3wRRBEUREqW3LaZaRKTFBxj/13SdmuHE3zJ
 43 |           w/3uOTn3JocAIcwZzhGmNXG00SK6fSNfyw1/TWdsV64fnjYZZC/ts7in+/oOh16htjug7qS6oarR
 44 |           AhxXssfUAHHgXWfZPEmX62y96kCjGAgvq7SLFipquORREieLKM6i2WpQ14pTsDhH7wFCCB260+eU
 45 |           DL5xjuLwVGnAWlIBzs9NCGGjhK9gYi23jkiHwxFSJR3ILvqjpIBarSQi0w4DZWuJTylbIYb68Xyl
 46 |           UJU2amsHfq6XXHJbFwaIVdLbC5CVq3HHjwFCH91w7UVerI1qtCuc+gTpLWdJb4jHlY5wPjCnHBET
 47 |           TRpeMSsYOMKFnewGU0JrYKNyXCRpGVcTEEyG/p3lmnc/OJfVf+xHQCloB6zQBhinl/OObQb8f/ur
 48 |           7bziLjC2e+ugKUouKzDa8P61S13EWZxuy1VGYxwcgx8AAAD//wMAIAzc+vsCAAA=
 49 |       headers:
 50 |         CF-Cache-Status:
 51 |           - DYNAMIC
 52 |         CF-RAY:
 53 |           - 8e84b2f90c81230e-SJC
 54 |         Connection:
 55 |           - keep-alive
 56 |         Content-Encoding:
 57 |           - gzip
 58 |         Content-Type:
 59 |           - application/json
 60 |         Date:
 61 |           - Mon, 25 Nov 2024 21:23:18 GMT
 62 |         Server:
 63 |           - cloudflare
 64 |         Set-Cookie:
 65 |           - __cf_bm=KqKw89zgaG32GNn3lg4IvjG2X2zLmPKRiY1oedcDUVM-1732569798-1.0.1.1-y_oblt_Jp3n1T.HtHFHrxbRegDqoC8gojQPBSV52IMBH.bx8c0QNAUrWotLzzQGqqbIDjdhl0AUutzvWk20psg;
 66 |             path=/; expires=Mon, 25-Nov-24 21:53:18 GMT; domain=.api.openai.com; HttpOnly;
 67 |             Secure; SameSite=None
 68 |           - _cfuvid=F_vLQWJJbY8GvEB4YIomOCy2NMswE7Ex8TL0Z4OIxgg-1732569798934-0.0.1.1-604800000;
 69 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 70 |         Transfer-Encoding:
 71 |           - chunked
 72 |         X-Content-Type-Options:
 73 |           - nosniff
 74 |         access-control-expose-headers:
 75 |           - X-Request-ID
 76 |         alt-svc:
 77 |           - h3=":443"; ma=86400
 78 |         openai-organization:
 79 |           - future-house-xr4tdh
 80 |         openai-processing-ms:
 81 |           - "256"
 82 |         openai-version:
 83 |           - "2020-10-01"
 84 |         strict-transport-security:
 85 |           - max-age=31536000; includeSubDomains; preload
 86 |         x-ratelimit-limit-requests:
 87 |           - "30000"
 88 |         x-ratelimit-limit-tokens:
 89 |           - "150000000"
 90 |         x-ratelimit-remaining-requests:
 91 |           - "29997"
 92 |         x-ratelimit-remaining-tokens:
 93 |           - "149998170"
 94 |         x-ratelimit-reset-requests:
 95 |           - 4ms
 96 |         x-ratelimit-reset-tokens:
 97 |           - 0s
 98 |         x-request-id:
 99 |           - req_77977a66fa96e40ffe5c3bc7840c0948
100 |       status:
101 |         code: 200
102 |         message: OK
103 | version: 1
104 | 


--------------------------------------------------------------------------------
/packages/lmi/tests/cassettes/TestLiteLLMModel.test_max_token_truncation[without-router].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "user", "content": "Please tell me a story"}], "model":
  5 |         "gpt-4o-mini", "max_tokens": 3}'
  6 |       headers:
  7 |         accept:
  8 |           - application/json
  9 |         accept-encoding:
 10 |           - gzip, deflate
 11 |         connection:
 12 |           - keep-alive
 13 |         content-length:
 14 |           - "110"
 15 |         content-type:
 16 |           - application/json
 17 |         host:
 18 |           - api.openai.com
 19 |         user-agent:
 20 |           - AsyncOpenAI/Python 1.46.1
 21 |         x-stainless-arch:
 22 |           - arm64
 23 |         x-stainless-async:
 24 |           - async:asyncio
 25 |         x-stainless-lang:
 26 |           - python
 27 |         x-stainless-os:
 28 |           - MacOS
 29 |         x-stainless-package-version:
 30 |           - 1.46.1
 31 |         x-stainless-raw-response:
 32 |           - "true"
 33 |         x-stainless-runtime:
 34 |           - CPython
 35 |         x-stainless-runtime-version:
 36 |           - 3.12.7
 37 |       method: POST
 38 |       uri: https://api.openai.com/v1/chat/completions
 39 |     response:
 40 |       body:
 41 |         string: !!binary |
 42 |           H4sIAAAAAAAAA4ySMW+DMBCFd36F5RkqQkJI2DpnqBSpUtqqQo59gFtju7aRkkb575UhAaKmUhcP
 43 |           9917fnf2KUAIc4ZzhGlNHG20iB535GvewmZ53MR8szhu29ftLnmx3/T5UOHQK9T+A6i7qh6oarQA
 44 |           x5XsMTVAHHjXWTZP0uU6W6cdaBQD4WWVdtFCRQ2XPEriZBHFWTRbXdS14hQsztFbgBBCp+70OSWD
 45 |           A85RHF4rDVhLKsD50IQQNkr4CibWcuuIdDgcIVXSgeyiP0kKqNVKIjLtMFC2lviUshXiUj8PVwpV
 46 |           aaP29sKHesklt3VhgFglvb0AWbkad/wcIPTeDdfe5MXaqEa7wqlPkN5ylvSGeFzpCOcX5pQjYqJJ
 47 |           wztmBQNHuLCT3WBKaA1sVI6LJC3jagKCydC/s9zz7gfnsvqP/QgoBe2AFdoA4/R23rHNgP9vf7UN
 48 |           K+4CY3u0Dpqi5LICow3vX7vURZzF6b5cZTTGwTn4AQAA//8DAGJIF8n7AgAA
 49 |       headers:
 50 |         CF-Cache-Status:
 51 |           - DYNAMIC
 52 |         CF-RAY:
 53 |           - 8e84b2e46a3e5c18-SJC
 54 |         Connection:
 55 |           - keep-alive
 56 |         Content-Encoding:
 57 |           - gzip
 58 |         Content-Type:
 59 |           - application/json
 60 |         Date:
 61 |           - Mon, 25 Nov 2024 21:23:15 GMT
 62 |         Server:
 63 |           - cloudflare
 64 |         Set-Cookie:
 65 |           - __cf_bm=pmbS4O0SdzCjzvZjensXpq5w1I1GUEOUOh_2ExJ8_Rc-1732569795-1.0.1.1-RsW0ExCXu..OFPcHXSvL3vh7_PqZu9gX0DgJI0BGjr2oborEPzdC6ZSsqZTfP9zf3YOigH1hcfDePksbYyIO8A;
 66 |             path=/; expires=Mon, 25-Nov-24 21:53:15 GMT; domain=.api.openai.com; HttpOnly;
 67 |             Secure; SameSite=None
 68 |           - _cfuvid=v_wT.VKOzzmIot1JtDgHglmHPmgOB.YvZxQznjpUEiA-1732569795663-0.0.1.1-604800000;
 69 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 70 |         Transfer-Encoding:
 71 |           - chunked
 72 |         X-Content-Type-Options:
 73 |           - nosniff
 74 |         access-control-expose-headers:
 75 |           - X-Request-ID
 76 |         alt-svc:
 77 |           - h3=":443"; ma=86400
 78 |         openai-organization:
 79 |           - future-house-xr4tdh
 80 |         openai-processing-ms:
 81 |           - "150"
 82 |         openai-version:
 83 |           - "2020-10-01"
 84 |         strict-transport-security:
 85 |           - max-age=31536000; includeSubDomains; preload
 86 |         x-ratelimit-limit-requests:
 87 |           - "30000"
 88 |         x-ratelimit-limit-tokens:
 89 |           - "150000000"
 90 |         x-ratelimit-remaining-requests:
 91 |           - "29999"
 92 |         x-ratelimit-remaining-tokens:
 93 |           - "149999990"
 94 |         x-ratelimit-reset-requests:
 95 |           - 2ms
 96 |         x-ratelimit-reset-tokens:
 97 |           - 0s
 98 |         x-request-id:
 99 |           - req_817b41328aed9a1e4a84bd7ec79e22f7
100 |       status:
101 |         code: 200
102 |         message: OK
103 | version: 1
104 | 


--------------------------------------------------------------------------------
/packages/lmi/tests/cassettes/TestMultipleCompletion.test_model[gpt-3.5-turbo-0125].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "system", "content": "Respond with single words."},
  5 |         {"role": "user", "content": "Hello, how are you?"}], "model": "gpt-3.5-turbo-0125",
  6 |         "max_tokens": 4096, "n": 2, "temperature": 0.1}'
  7 |       headers:
  8 |         accept:
  9 |           - application/json
 10 |         accept-encoding:
 11 |           - gzip, deflate
 12 |         connection:
 13 |           - keep-alive
 14 |         content-length:
 15 |           - "206"
 16 |         content-type:
 17 |           - application/json
 18 |         host:
 19 |           - api.openai.com
 20 |         user-agent:
 21 |           - AsyncOpenAI/Python 1.60.0
 22 |         x-stainless-arch:
 23 |           - arm64
 24 |         x-stainless-async:
 25 |           - async:asyncio
 26 |         x-stainless-lang:
 27 |           - python
 28 |         x-stainless-os:
 29 |           - MacOS
 30 |         x-stainless-package-version:
 31 |           - 1.60.0
 32 |         x-stainless-raw-response:
 33 |           - "true"
 34 |         x-stainless-retry-count:
 35 |           - "0"
 36 |         x-stainless-runtime:
 37 |           - CPython
 38 |         x-stainless-runtime-version:
 39 |           - 3.12.4
 40 |       method: POST
 41 |       uri: https://api.openai.com/v1/chat/completions
 42 |     response:
 43 |       body:
 44 |         string: !!binary |
 45 |           H4sIAAAAAAAAAwAAAP//1FPLTsMwELznKyyfm6oPSqE3JCQOcELihFDk2NvUxfEa7wYBFf+OnLRN
 46 |           UEHiyiWHmZ3J7MO7TAhpjVwJqTeKdR1cfkXb8rq2lb29O79Xdx+3b01J6uHhZQsXUY6SAsstaD6o
 47 |           xhrr4IAt+o7WERRDcp0u58vzycV8cdkSNRpwSVYFzufjRc5NLDGfTGeLvXKDVgPJlXjMhBBi135T
 48 |           Rm/gTa7EZHRAaiBSFcjVsUgIGdElRCoiS6w8y1FPavQMvo19g2iGVIR1QypF841ze/zz+C+HVYhY
 49 |           0p4/4mvrLW2KCIrQJ19iDDIbiE8amP6bBjIhntqlNN9iyhCxDlwwPoNPhrNZZyf7MxiQe46RlRvA
 50 |           Z6MfzAoDrKyjwUikVnoDplf2B6AaY3FADMd+muUn765t66u/2PeE1hAYTBEiGKu/99uXRUhv5Ley
 51 |           44jbwJIgvloNBVuIaQ0G1qpx3fIlvRNDXaytryCGaNsLaNf8mX0BAAD//wMAWjXvTcEDAAA=
 52 |       headers:
 53 |         CF-Cache-Status:
 54 |           - DYNAMIC
 55 |         CF-RAY:
 56 |           - 906536b37c63679b-SJC
 57 |         Connection:
 58 |           - keep-alive
 59 |         Content-Encoding:
 60 |           - gzip
 61 |         Content-Type:
 62 |           - application/json
 63 |         Date:
 64 |           - Thu, 23 Jan 2025 04:59:19 GMT
 65 |         Server:
 66 |           - cloudflare
 67 |         Set-Cookie:
 68 |           - __cf_bm=bbe91RL8pynoc8FwJWONXTz9iPs24xtiuVm.KiZccgg-1737608359-1.0.1.1-4MY0muOtVyYr8hyafTjKQEnS6CzShHD_gr1zV4jE0BX8Q7GKl0jg.CfuuJAejDm7ssESqqnEFdi90KdjJqX0iA;
 69 |             path=/; expires=Thu, 23-Jan-25 05:29:19 GMT; domain=.api.openai.com; HttpOnly;
 70 |             Secure; SameSite=None
 71 |           - _cfuvid=fVO2Os4JLfnO.SjLcpo.a17BzAYLtUPKLCrieYjvhQo-1737608359268-0.0.1.1-604800000;
 72 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 73 |         Transfer-Encoding:
 74 |           - chunked
 75 |         X-Content-Type-Options:
 76 |           - nosniff
 77 |         access-control-expose-headers:
 78 |           - X-Request-ID
 79 |         alt-svc:
 80 |           - h3=":443"; ma=86400
 81 |         openai-organization:
 82 |           - future-house-xr4tdh
 83 |         openai-processing-ms:
 84 |           - "212"
 85 |         openai-version:
 86 |           - "2020-10-01"
 87 |         strict-transport-security:
 88 |           - max-age=31536000; includeSubDomains; preload
 89 |         x-ratelimit-limit-requests:
 90 |           - "12000"
 91 |         x-ratelimit-limit-tokens:
 92 |           - "1000000"
 93 |         x-ratelimit-remaining-requests:
 94 |           - "11999"
 95 |         x-ratelimit-remaining-tokens:
 96 |           - "991822"
 97 |         x-ratelimit-reset-requests:
 98 |           - 5ms
 99 |         x-ratelimit-reset-tokens:
100 |           - 490ms
101 |         x-request-id:
102 |           - req_d5da645d9bde91ef8bbcd32b1d58cb33
103 |       status:
104 |         code: 200
105 |         message: OK
106 | version: 1
107 | 


--------------------------------------------------------------------------------
/packages/lmi/tests/cassettes/TestMultipleCompletion.test_model[gpt-3.5-turbo].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "system", "content": "Respond with single words."},
  5 |         {"role": "user", "content": "Hello, how are you?"}], "model": "gpt-3.5-turbo"}'
  6 |       headers:
  7 |         accept:
  8 |           - application/json
  9 |         accept-encoding:
 10 |           - gzip, deflate
 11 |         connection:
 12 |           - keep-alive
 13 |         content-length:
 14 |           - "153"
 15 |         content-type:
 16 |           - application/json
 17 |         host:
 18 |           - api.openai.com
 19 |         user-agent:
 20 |           - AsyncOpenAI/Python 1.59.7
 21 |         x-stainless-arch:
 22 |           - arm64
 23 |         x-stainless-async:
 24 |           - async:asyncio
 25 |         x-stainless-lang:
 26 |           - python
 27 |         x-stainless-os:
 28 |           - MacOS
 29 |         x-stainless-package-version:
 30 |           - 1.59.7
 31 |         x-stainless-raw-response:
 32 |           - "true"
 33 |         x-stainless-retry-count:
 34 |           - "0"
 35 |         x-stainless-runtime:
 36 |           - CPython
 37 |         x-stainless-runtime-version:
 38 |           - 3.12.7
 39 |       method: POST
 40 |       uri: https://api.openai.com/v1/chat/completions
 41 |     response:
 42 |       body:
 43 |         string: !!binary |
 44 |           H4sIAAAAAAAAAwAAAP//jJJPT8MwDMXv/RRRzt20v0zaDXEYQmgHJMQBoSpLvDYsjUPibqBp3x2l
 45 |           LWsnhsSlh/ezX5/tHBPGuFZ8ybgsBMnSmcHtx+7uxdyv5Wo3Wz/A0wGfZyu3f8z3CzrwNHbg5h0k
 46 |           /XQNJZbOAGm0DZYeBEF0HS+mi/F0Nhrf1KBEBSa25Y4G0+F8QJXf4GA0nszbzgK1hMCX7DVhjLFj
 47 |           /Y0ZrYJPvmSj9EcpIQSRA1+eixjjHk1UuAhBBxKWeNpBiZbA1rFXiKqPPGyrIGI0WxnT6qfzvwzm
 48 |           zuMmtPysb7XVocg8iIA2+gZCx2t6Shh7q2eqLmJy57F0lBHuwEbDyaSx490We7BlhCRMT56lV8wy
 49 |           BSS0Cb2VcClkAarr7PYnKqWxB5LeyL+zXPNuxtY2/499B6QER6Ay50FpeTlvV+YhPrG/ys4rrgPz
 50 |           AH6vJWSkwcczKNiKyjTH5+ErEJTZVtscvPO6fgH1mU/JNwAAAP//AwAmgFaGAAMAAA==
 51 |       headers:
 52 |         CF-Cache-Status:
 53 |           - DYNAMIC
 54 |         CF-RAY:
 55 |           - 9037fa12aa64ebe5-SJC
 56 |         Connection:
 57 |           - keep-alive
 58 |         Content-Encoding:
 59 |           - gzip
 60 |         Content-Type:
 61 |           - application/json
 62 |         Date:
 63 |           - Fri, 17 Jan 2025 17:13:36 GMT
 64 |         Server:
 65 |           - cloudflare
 66 |         Set-Cookie:
 67 |           - __cf_bm=sBEhET_ucmEw1fj49k97O6lYPFKpa8FC7g85fCwHQdA-1737134016-1.0.1.1-Y2pqd.8untxxrd4CV3MVcvrzkxtXf7VBF717.ygynQmR3B_Hl_YvH2o4zsYUQFj75ENY35qzY8hjkF3qGvyZOw;
 68 |             path=/; expires=Fri, 17-Jan-25 17:43:36 GMT; domain=.api.openai.com; HttpOnly;
 69 |             Secure; SameSite=None
 70 |           - _cfuvid=.OXPSLgaNOtRCwyCdctf7AFOBazBNO8OQRpV77U6rCM-1737134016656-0.0.1.1-604800000;
 71 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 72 |         Transfer-Encoding:
 73 |           - chunked
 74 |         X-Content-Type-Options:
 75 |           - nosniff
 76 |         access-control-expose-headers:
 77 |           - X-Request-ID
 78 |         alt-svc:
 79 |           - h3=":443"; ma=86400
 80 |         openai-organization:
 81 |           - future-house-xr4tdh
 82 |         openai-processing-ms:
 83 |           - "133"
 84 |         openai-version:
 85 |           - "2020-10-01"
 86 |         strict-transport-security:
 87 |           - max-age=31536000; includeSubDomains; preload
 88 |         x-ratelimit-limit-requests:
 89 |           - "12000"
 90 |         x-ratelimit-limit-tokens:
 91 |           - "1000000"
 92 |         x-ratelimit-remaining-requests:
 93 |           - "11999"
 94 |         x-ratelimit-remaining-tokens:
 95 |           - "999969"
 96 |         x-ratelimit-reset-requests:
 97 |           - 5ms
 98 |         x-ratelimit-reset-tokens:
 99 |           - 1ms
100 |         x-request-id:
101 |           - req_e1b9df957943f220f9b008b98d8d4ad3
102 |       status:
103 |         code: 200
104 |         message: OK
105 | version: 1
106 | 


--------------------------------------------------------------------------------
/packages/lmi/tests/cassettes/TestMultipleCompletion.test_model[gpt-4o-mini-2024-07-18].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "system", "content": "Respond with single words."},
  5 |         {"role": "user", "content": "Hello, how are you?"}], "model": "gpt-4o-mini-2024-07-18",
  6 |         "max_tokens": 4096, "n": 2, "temperature": 0.1}'
  7 |       headers:
  8 |         accept:
  9 |           - application/json
 10 |         accept-encoding:
 11 |           - gzip, deflate
 12 |         connection:
 13 |           - keep-alive
 14 |         content-length:
 15 |           - "210"
 16 |         content-type:
 17 |           - application/json
 18 |         host:
 19 |           - api.openai.com
 20 |         user-agent:
 21 |           - AsyncOpenAI/Python 1.59.4
 22 |         x-stainless-arch:
 23 |           - arm64
 24 |         x-stainless-async:
 25 |           - async:asyncio
 26 |         x-stainless-lang:
 27 |           - python
 28 |         x-stainless-os:
 29 |           - MacOS
 30 |         x-stainless-package-version:
 31 |           - 1.59.4
 32 |         x-stainless-raw-response:
 33 |           - "true"
 34 |         x-stainless-retry-count:
 35 |           - "0"
 36 |         x-stainless-runtime:
 37 |           - CPython
 38 |         x-stainless-runtime-version:
 39 |           - 3.12.7
 40 |       method: POST
 41 |       uri: https://api.openai.com/v1/chat/completions
 42 |     response:
 43 |       body:
 44 |         string: !!binary |
 45 |           H4sIAAAAAAAAAwAAAP//1FPBatwwEL37K9Q5r8va3bXD3paE5tDeWgqlFKOVxrZSWSOkcUkJ+fci
 46 |           e7N2SAq95uLDvHnP782MHjIhwGg4CFC9ZDV4mx/j9693lf/YX8fjpxs1fj59+cb37W11LMMNbBKD
 47 |           Tneo+In1XtHgLbIhN8MqoGRMqkX9od5X+6ooJmAgjTbROs/5jvLBOJOX23KXb+u8uDqzezIKIxzE
 48 |           j0wIIR6mb/LpNN7DQWw3T5UBY5QdwuHSJAQEsqkCMkYTWTqGzQIqcoxusn5LpN+tsYDtGGXy50Zr
 49 |           z/XHy88sdT7QKZ7xS701zsS+CSgjuSQcmTxkK/KLBMXbSZAJ8XNay/jMJ/hAg+eG6Re6JFiWsxws
 50 |           x7CA1RljYmlXnKvNK2KNRpbGxtVMQEnVo16YywnIURtaAeu5v/TymvYc27juf+QXQCn0jLrxAbVR
 51 |           z/MubQHTS/lX22XEk2GIGH4bhQ0bDGkNGls52nn7EP9ExqFpjesw+GDmE2h9U5eoa3na7xRkj9lf
 52 |           AAAA//8DAL+Guu3SAwAA
 53 |       headers:
 54 |         CF-RAY:
 55 |           - 906123104eef6804-SJC
 56 |         Connection:
 57 |           - keep-alive
 58 |         Content-Encoding:
 59 |           - gzip
 60 |         Content-Type:
 61 |           - application/json
 62 |         Date:
 63 |           - Wed, 22 Jan 2025 17:06:52 GMT
 64 |         Server:
 65 |           - cloudflare
 66 |         Set-Cookie:
 67 |           - __cf_bm=0AU5UBKcyJz8Is5N3AXFGiVfs40PPUx5w39vHFzp8ZE-1737565612-1.0.1.1-i3ipRUtk3POiwcBFVN_BwKvHxpOBDsWu0rNxwUC2FDSvaO0r5Ye.s9_FdZkNSKdiC.dRJRy5LbqjCCll.G26oQ;
 68 |             path=/; expires=Wed, 22-Jan-25 17:36:52 GMT; domain=.api.openai.com; HttpOnly;
 69 |             Secure; SameSite=None
 70 |           - _cfuvid=_hKYeboiOAsgsNVboFQJcjY4DMG.3STQtZ6iRMz1QOU-1737565612020-0.0.1.1-604800000;
 71 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 72 |         Transfer-Encoding:
 73 |           - chunked
 74 |         X-Content-Type-Options:
 75 |           - nosniff
 76 |         access-control-expose-headers:
 77 |           - X-Request-ID
 78 |         alt-svc:
 79 |           - h3=":443"; ma=86400
 80 |         cf-cache-status:
 81 |           - DYNAMIC
 82 |         openai-organization:
 83 |           - future-house-xr4tdh
 84 |         openai-processing-ms:
 85 |           - "338"
 86 |         openai-version:
 87 |           - "2020-10-01"
 88 |         strict-transport-security:
 89 |           - max-age=31536000; includeSubDomains; preload
 90 |         x-ratelimit-limit-requests:
 91 |           - "30000"
 92 |         x-ratelimit-limit-tokens:
 93 |           - "150000000"
 94 |         x-ratelimit-remaining-requests:
 95 |           - "29999"
 96 |         x-ratelimit-remaining-tokens:
 97 |           - "149991793"
 98 |         x-ratelimit-reset-requests:
 99 |           - 2ms
100 |         x-ratelimit-reset-tokens:
101 |           - 3ms
102 |         x-request-id:
103 |           - req_af628db22df56361b4e04d5bf342574d
104 |       status:
105 |         code: 200
106 |         message: OK
107 | version: 1
108 | 


--------------------------------------------------------------------------------
/packages/lmi/tests/cassettes/TestMultipleCompletion.test_model[gpt-4o-mini].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "system", "content": "Respond with single words."},
  5 |         {"role": "user", "content": "Hello, how are you?"}], "model": "gpt-4o-mini"}'
  6 |       headers:
  7 |         accept:
  8 |           - application/json
  9 |         accept-encoding:
 10 |           - gzip, deflate
 11 |         connection:
 12 |           - keep-alive
 13 |         content-length:
 14 |           - "151"
 15 |         content-type:
 16 |           - application/json
 17 |         host:
 18 |           - api.openai.com
 19 |         user-agent:
 20 |           - AsyncOpenAI/Python 1.59.7
 21 |         x-stainless-arch:
 22 |           - arm64
 23 |         x-stainless-async:
 24 |           - async:asyncio
 25 |         x-stainless-lang:
 26 |           - python
 27 |         x-stainless-os:
 28 |           - MacOS
 29 |         x-stainless-package-version:
 30 |           - 1.59.7
 31 |         x-stainless-raw-response:
 32 |           - "true"
 33 |         x-stainless-retry-count:
 34 |           - "0"
 35 |         x-stainless-runtime:
 36 |           - CPython
 37 |         x-stainless-runtime-version:
 38 |           - 3.12.7
 39 |       method: POST
 40 |       uri: https://api.openai.com/v1/chat/completions
 41 |     response:
 42 |       body:
 43 |         string: !!binary |
 44 |           H4sIAAAAAAAAA4ySQW/UMBCF7/kVZs4blE2Wbrs3pAq4IcQBJIQirz1J3NoeY09QUbX/HTnZblK1
 45 |           SFx8mG/e85uxHwshwGg4CFCDZOWCLd//ur+lB3d0Oz987VMlu+/WfPl2++HT5zsNm6yg4x0qflK9
 46 |           VeSCRTbkZ6wiSsbsut03+22zq26uJuBIo82yPnC5o9IZb8q6qndltS+312f1QEZhgoP4UQghxON0
 47 |           5pxe4wMcRLV5qjhMSfYIh0uTEBDJ5grIlExi6Rk2C1TkGf0U/SORfrNmEbsxyZzPj9ae66fLZZb6
 48 |           EOmYzvxS74w3aWgjykQ+GyemABM9FUL8nIYan+WEEMkFbpnu0WfDup7tYFnlApszY2JpV5p3m1fM
 49 |           Wo0sjU2rnYCSakC9KJcFylEbWoFiNfLLLK95z2Mb3/+P/QKUwsCo2xBRG/V83qUtYv5n/2q7rHgK
 50 |           DAnjb6OwZYMxP4PGTo52fn1IfxKjazvje4whmvkLdKE96uumqW+6qwaKU/EXAAD//wMAQaS4thAD
 51 |           AAA=
 52 |       headers:
 53 |         CF-Cache-Status:
 54 |           - DYNAMIC
 55 |         CF-RAY:
 56 |           - 9037fc09580bd045-SJC
 57 |         Connection:
 58 |           - keep-alive
 59 |         Content-Encoding:
 60 |           - gzip
 61 |         Content-Type:
 62 |           - application/json
 63 |         Date:
 64 |           - Fri, 17 Jan 2025 17:14:57 GMT
 65 |         Server:
 66 |           - cloudflare
 67 |         Set-Cookie:
 68 |           - __cf_bm=HlSNS.gT._y7cHrNqXSekKB0MjIrTa0AaS0nE.welTg-1737134097-1.0.1.1-o2GwXAUWpjygAFlkSQqTOJk9PIvrzfkL5hcC4C_ebboFSTvSb8e0018Z42ilOx18M.vaCSWqF.oh861HSvq85Q;
 69 |             path=/; expires=Fri, 17-Jan-25 17:44:57 GMT; domain=.api.openai.com; HttpOnly;
 70 |             Secure; SameSite=None
 71 |           - _cfuvid=KHvEM4IFbWYj2GdNChMj5sEdEejFcK_8z8SFW.hDqvY-1737134097138-0.0.1.1-604800000;
 72 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 73 |         Transfer-Encoding:
 74 |           - chunked
 75 |         X-Content-Type-Options:
 76 |           - nosniff
 77 |         access-control-expose-headers:
 78 |           - X-Request-ID
 79 |         alt-svc:
 80 |           - h3=":443"; ma=86400
 81 |         openai-organization:
 82 |           - future-house-xr4tdh
 83 |         openai-processing-ms:
 84 |           - "166"
 85 |         openai-version:
 86 |           - "2020-10-01"
 87 |         strict-transport-security:
 88 |           - max-age=31536000; includeSubDomains; preload
 89 |         x-ratelimit-limit-requests:
 90 |           - "30000"
 91 |         x-ratelimit-limit-tokens:
 92 |           - "150000000"
 93 |         x-ratelimit-remaining-requests:
 94 |           - "29999"
 95 |         x-ratelimit-remaining-tokens:
 96 |           - "149999970"
 97 |         x-ratelimit-reset-requests:
 98 |           - 2ms
 99 |         x-ratelimit-reset-tokens:
100 |           - 0s
101 |         x-request-id:
102 |           - req_a304ff40cdb7bf3c789644e502d1651d
103 |       status:
104 |         code: 200
105 |         message: OK
106 | version: 1
107 | 


--------------------------------------------------------------------------------
/packages/lmi/tests/cassettes/TestTooling.test_empty_tools[Anthropic-empty-tools].yaml:
--------------------------------------------------------------------------------
 1 | interactions:
 2 |   - request:
 3 |       body:
 4 |         '{"model": "claude-3-5-haiku-20241022", "messages": [{"role": "user", "content":
 5 |         [{"type": "text", "text": "What does 42 mean?"}]}], "temperature": 0.1, "max_tokens":
 6 |         56}'
 7 |       headers:
 8 |         accept:
 9 |           - application/json
10 |         accept-encoding:
11 |           - gzip, deflate
12 |         anthropic-version:
13 |           - "2023-06-01"
14 |         connection:
15 |           - keep-alive
16 |         content-length:
17 |           - "169"
18 |         content-type:
19 |           - application/json
20 |         host:
21 |           - api.anthropic.com
22 |         user-agent:
23 |           - litellm/1.59.5
24 |       method: POST
25 |       uri: https://api.anthropic.com/v1/messages
26 |     response:
27 |       body:
28 |         string: !!binary |
29 |           H4sIAAAAAAAAAwAAAP//ZJFNj9NADIb/iuXLXqaoDW0FuVXa1YLgggQHRFHknTjJkMk4jGe6zVb9
30 |           7yiBSiBOlv28/r6gq7HEQdtqvfnAstu//Hjzss+br/eH3L49dZOgwTSNPKtYlVpGg1H8HCBVp4lC
31 |           QoOD1OyxROsp17x6vdqtOnJ9XhXrYrtZFwUatBISh4Tlt8utZuLznL2YErcFOIWGBsnqJ+iDPAdo
32 |           ogxwL7n1pHCoadA7UOs4WIbG2eQkgJWB6wmeRHo44ueO4Z1Ltutcz/FO4TG7miEJpI7hkTydpyMC
33 |           6eIf8RD0meONf/HJDZQYPmXWpbo08NE1bH7j4E4clQ1QqOHhxHFKnQvtqyPC+7BI5jEMEGgeOVoZ
34 |           xpw4giVvs6fEc1unQEtXvH43qEnGKjKphPnOdK6S9BwU/yDln3neF8uQvTeYlz+UF3RhzOkmLjdb
35 |           g5Zsx5WNTPPo1b+C9Y1Hpvp/Jjn9Hdntr9dfAAAA//8DAPISxfshAgAA
36 |       headers:
37 |         CF-RAY:
38 |           - 910ad9db995ded38-SJC
39 |         Connection:
40 |           - keep-alive
41 |         Content-Encoding:
42 |           - gzip
43 |         Content-Type:
44 |           - application/json
45 |         Date:
46 |           - Wed, 12 Feb 2025 07:26:33 GMT
47 |         Server:
48 |           - cloudflare
49 |         Transfer-Encoding:
50 |           - chunked
51 |         X-Robots-Tag:
52 |           - none
53 |         anthropic-ratelimit-input-tokens-limit:
54 |           - "5000000"
55 |         anthropic-ratelimit-input-tokens-remaining:
56 |           - "5000000"
57 |         anthropic-ratelimit-input-tokens-reset:
58 |           - "2025-02-12T07:26:32Z"
59 |         anthropic-ratelimit-output-tokens-limit:
60 |           - "1000000"
61 |         anthropic-ratelimit-output-tokens-remaining:
62 |           - "1000000"
63 |         anthropic-ratelimit-output-tokens-reset:
64 |           - "2025-02-12T07:26:33Z"
65 |         anthropic-ratelimit-requests-limit:
66 |           - "5000"
67 |         anthropic-ratelimit-requests-remaining:
68 |           - "4999"
69 |         anthropic-ratelimit-requests-reset:
70 |           - "2025-02-12T07:26:32Z"
71 |         anthropic-ratelimit-tokens-limit:
72 |           - "6000000"
73 |         anthropic-ratelimit-tokens-remaining:
74 |           - "6000000"
75 |         anthropic-ratelimit-tokens-reset:
76 |           - "2025-02-12T07:26:32Z"
77 |         cf-cache-status:
78 |           - DYNAMIC
79 |         request-id:
80 |           - req_014o74duDsmRJrXujBWdcNDt
81 |         via:
82 |           - 1.1 google
83 |       status:
84 |         code: 200
85 |         message: OK
86 | version: 1
87 | 


--------------------------------------------------------------------------------
/packages/lmi/tests/cassettes/TestTooling.test_empty_tools[Anthropic-no-tools].yaml:
--------------------------------------------------------------------------------
 1 | interactions:
 2 |   - request:
 3 |       body:
 4 |         '{"model": "claude-3-5-haiku-20241022", "messages": [{"role": "user", "content":
 5 |         [{"type": "text", "text": "What does 42 mean?"}]}], "temperature": 0.1, "max_tokens":
 6 |         56}'
 7 |       headers:
 8 |         accept:
 9 |           - application/json
10 |         accept-encoding:
11 |           - gzip, deflate
12 |         anthropic-version:
13 |           - "2023-06-01"
14 |         connection:
15 |           - keep-alive
16 |         content-length:
17 |           - "169"
18 |         content-type:
19 |           - application/json
20 |         host:
21 |           - api.anthropic.com
22 |         user-agent:
23 |           - litellm/1.59.5
24 |       method: POST
25 |       uri: https://api.anthropic.com/v1/messages
26 |     response:
27 |       body:
28 |         string: !!binary |
29 |           H4sIAAAAAAAAA2SRwYrbQAyGX0XoshenJG42Bd8WUjYtSyGwPTXFTMeyZ/B45I40u3FD3r3YbWBL
30 |           T0L6folf0gV9gxUO0tXrzdOB7fFYfvm8a3dx82F7yOr2v7BAnUaaVSRiOsICE4e5YES8qImKBQ7c
31 |           UMAKbTC5odX71f3KGd/nVbkut5t1WWKBlqNSVKy+XW4zlc5z9xIq3JbgBVozcJYwQR/5NUKbeIA9
32 |           5y4YgYfGDHIHYj1FS9B6q54jWB6omeAHcw8nfHYEB6/WOd9TuhN4zL4hUAZ1BI8mmPN0QjCy5Cd8
33 |           iPJK6ca/BvWDUYJjJlmmcwtPvqXiD47+hZJQASY28PGF0qTOx+7dCeFTXCSzjQIMSB4pWR7GrJTA
34 |           mhCogT3RCM+Oc+cUr98LFOWxTmSE43xkc66Ve4qCf5HQzzwvi1XMIRSYlydUF/RxzHoTV5ttgdZY
35 |           R7VNZGbf9b+C9Y0nMs3/jLO+rdzvrtffAAAA//8DAEH9A5MeAgAA
36 |       headers:
37 |         CF-RAY:
38 |           - 910ada053e7f689a-SJC
39 |         Connection:
40 |           - keep-alive
41 |         Content-Encoding:
42 |           - gzip
43 |         Content-Type:
44 |           - application/json
45 |         Date:
46 |           - Wed, 12 Feb 2025 07:26:40 GMT
47 |         Server:
48 |           - cloudflare
49 |         Transfer-Encoding:
50 |           - chunked
51 |         X-Robots-Tag:
52 |           - none
53 |         anthropic-ratelimit-input-tokens-limit:
54 |           - "5000000"
55 |         anthropic-ratelimit-input-tokens-remaining:
56 |           - "5000000"
57 |         anthropic-ratelimit-input-tokens-reset:
58 |           - "2025-02-12T07:26:39Z"
59 |         anthropic-ratelimit-output-tokens-limit:
60 |           - "1000000"
61 |         anthropic-ratelimit-output-tokens-remaining:
62 |           - "1000000"
63 |         anthropic-ratelimit-output-tokens-reset:
64 |           - "2025-02-12T07:26:40Z"
65 |         anthropic-ratelimit-requests-limit:
66 |           - "5000"
67 |         anthropic-ratelimit-requests-remaining:
68 |           - "4999"
69 |         anthropic-ratelimit-requests-reset:
70 |           - "2025-02-12T07:26:39Z"
71 |         anthropic-ratelimit-tokens-limit:
72 |           - "6000000"
73 |         anthropic-ratelimit-tokens-remaining:
74 |           - "6000000"
75 |         anthropic-ratelimit-tokens-reset:
76 |           - "2025-02-12T07:26:39Z"
77 |         cf-cache-status:
78 |           - DYNAMIC
79 |         request-id:
80 |           - req_014N65NM1873o5sdT25QAzx2
81 |         via:
82 |           - 1.1 google
83 |       status:
84 |         code: 200
85 |         message: OK
86 | version: 1
87 | 


--------------------------------------------------------------------------------
/packages/lmi/tests/cassettes/TestTooling.test_empty_tools[OpenAI-empty-tools].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "user", "content": "What does 42 mean?"}], "model":
  5 |         "gpt-4o-mini-2024-07-18", "max_tokens": 56, "n": 1, "temperature": 0.1}'
  6 |       headers:
  7 |         accept:
  8 |           - application/json
  9 |         accept-encoding:
 10 |           - gzip, deflate
 11 |         connection:
 12 |           - keep-alive
 13 |         content-length:
 14 |           - "146"
 15 |         content-type:
 16 |           - application/json
 17 |         host:
 18 |           - api.openai.com
 19 |         user-agent:
 20 |           - AsyncOpenAI/Python 1.60.0
 21 |         x-stainless-arch:
 22 |           - arm64
 23 |         x-stainless-async:
 24 |           - async:asyncio
 25 |         x-stainless-lang:
 26 |           - python
 27 |         x-stainless-os:
 28 |           - MacOS
 29 |         x-stainless-package-version:
 30 |           - 1.60.0
 31 |         x-stainless-raw-response:
 32 |           - "true"
 33 |         x-stainless-retry-count:
 34 |           - "0"
 35 |         x-stainless-runtime:
 36 |           - CPython
 37 |         x-stainless-runtime-version:
 38 |           - 3.12.4
 39 |       method: POST
 40 |       uri: https://api.openai.com/v1/chat/completions
 41 |     response:
 42 |       body:
 43 |         string: !!binary |
 44 |           H4sIAAAAAAAAAwAAAP//jFNNb9swDL3nVxC69GIX+WzW3Dp0yzbssALbaRkMRaJtNrJkiHRbo+h/
 45 |           H2yncYZ1wC4G9B758MhHP08AFFm1AWVKLaaqXfp+Orsz23zbsKzu2y+8Xcy3324/PpkqHA4q6TrC
 46 |           /h6NvHZdmlDVDoWCH2gTUQt2qrP14nqxXM2upz1RBYuuaytqSZchrchTOp/Ol+l0nc7eHbvLQAZZ
 47 |           beDnBADguf92Pr3FJ7WBXqtHKmTWBarNqQhAxeA6RGlmYtFeVDKSJnhB31v/XiL4ptpjhOUciCHX
 48 |           VWjYtXDw4dGDZtgpKRFuPD9iBAnQvX44oUoLwl2D3M0MIYevlGMy0J4eMDImoL2FDw8YWynJFzsF
 49 |           5OE2NIXTDDdWV3wBbAi9QcjJ9EqMkZAT2PXmPpGYsqQDxguGbUMWXz1stdNP7eVOwWffAywhtglo
 50 |           KGJo6s5R2dYYU/KCzlGBXmCP5AuGfUPOMujzrUTMG9ZdMr5x7oi/nNbsQlHHsOcjf8Jz8sRlFlFz
 51 |           8N1KHfpCStXzLxOAX32gzR8ZqTqGqpZMwgF9JzlbDIJqPKORXF0dSQmi3YhfXSdvqGUWRZPjs4NQ
 52 |           RpsS7dg5Xo9uLIUzYnI29d9m3tIeJidf/I/8SBiDtaDN6oh2SP6tsojdT/avstOOe8OKMT6QwUwI
 53 |           Y5eExVw3bjh9xS0LVllOvsBYRxruP6+z9RztWu9XS6MmL5PfAAAA//8DAIQI5eENBAAA
 54 |       headers:
 55 |         CF-RAY:
 56 |           - 910ad9cd0d9dfae3-SJC
 57 |         Connection:
 58 |           - keep-alive
 59 |         Content-Encoding:
 60 |           - gzip
 61 |         Content-Type:
 62 |           - application/json
 63 |         Date:
 64 |           - Wed, 12 Feb 2025 07:26:30 GMT
 65 |         Server:
 66 |           - cloudflare
 67 |         Set-Cookie:
 68 |           - __cf_bm=TSiOYmPilz2y7Jm0I0xOnHulR5vDLiJjM_Tk_6ibsb0-1739345190-1.0.1.1-XaU3LvYSVCset.TzV8TpZunDbHgKU02_JUjyYrd1cn8K4eSx2UYKCGbZis4LZejgM5LMmHAkUcbIsTRTeXrgyQ;
 69 |             path=/; expires=Wed, 12-Feb-25 07:56:30 GMT; domain=.api.openai.com; HttpOnly;
 70 |             Secure; SameSite=None
 71 |           - _cfuvid=U0EwGnOG.JseWfrnCZ1q.Sl0s6BhsNoFqTwgRWuYAJs-1739345190935-0.0.1.1-604800000;
 72 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 73 |         Transfer-Encoding:
 74 |           - chunked
 75 |         X-Content-Type-Options:
 76 |           - nosniff
 77 |         access-control-expose-headers:
 78 |           - X-Request-ID
 79 |         alt-svc:
 80 |           - h3=":443"; ma=86400
 81 |         cf-cache-status:
 82 |           - DYNAMIC
 83 |         openai-organization:
 84 |           - future-house-xr4tdh
 85 |         openai-processing-ms:
 86 |           - "905"
 87 |         openai-version:
 88 |           - "2020-10-01"
 89 |         strict-transport-security:
 90 |           - max-age=31536000; includeSubDomains; preload
 91 |         x-ratelimit-limit-requests:
 92 |           - "30000"
 93 |         x-ratelimit-limit-tokens:
 94 |           - "150000000"
 95 |         x-ratelimit-remaining-requests:
 96 |           - "29999"
 97 |         x-ratelimit-remaining-tokens:
 98 |           - "149999937"
 99 |         x-ratelimit-reset-requests:
100 |           - 2ms
101 |         x-ratelimit-reset-tokens:
102 |           - 0s
103 |         x-request-id:
104 |           - req_ca2b9465ba11da2901a8230e9fec93ba
105 |       status:
106 |         code: 200
107 |         message: OK
108 | version: 1
109 | 


--------------------------------------------------------------------------------
/packages/lmi/tests/cassettes/TestTooling.test_empty_tools[OpenAI-no-tools].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "user", "content": "What does 42 mean?"}], "model":
  5 |         "gpt-4o-mini-2024-07-18", "max_tokens": 56, "n": 1, "temperature": 0.1}'
  6 |       headers:
  7 |         accept:
  8 |           - application/json
  9 |         accept-encoding:
 10 |           - gzip, deflate
 11 |         connection:
 12 |           - keep-alive
 13 |         content-length:
 14 |           - "146"
 15 |         content-type:
 16 |           - application/json
 17 |         host:
 18 |           - api.openai.com
 19 |         user-agent:
 20 |           - AsyncOpenAI/Python 1.60.0
 21 |         x-stainless-arch:
 22 |           - arm64
 23 |         x-stainless-async:
 24 |           - async:asyncio
 25 |         x-stainless-lang:
 26 |           - python
 27 |         x-stainless-os:
 28 |           - MacOS
 29 |         x-stainless-package-version:
 30 |           - 1.60.0
 31 |         x-stainless-raw-response:
 32 |           - "true"
 33 |         x-stainless-retry-count:
 34 |           - "0"
 35 |         x-stainless-runtime:
 36 |           - CPython
 37 |         x-stainless-runtime-version:
 38 |           - 3.12.4
 39 |       method: POST
 40 |       uri: https://api.openai.com/v1/chat/completions
 41 |     response:
 42 |       body:
 43 |         string: !!binary |
 44 |           H4sIAAAAAAAAAwAAAP//jFNNb9swDL3nVxC69GIXcZI2bW5bC7Q7bd3HaRkMRaJtLrLkiFJao+h/
 45 |           L2yncYZ1wC4G9B758MhHP08ABGmxAqEqGVTdmPTjNHvQN/uHOcer28/hS/Z41377cfP1flfNdiLp
 46 |           OtzmN6rw1nWuXN0YDOTsQCuPMmCnmi3n1/PFRXad9UTtNJqurWxCunBpTZbS2XS2SKfLNLs6dFeO
 47 |           FLJYwc8JAMBz/+18Wo1PYgXT5A2pkVmWKFbHIgDhnekQIZmJg7RBJCOpnA1oe+vfKwQb6w16WMyA
 48 |           GApZu8imha11jxYkw1qECkFafkQPwUH3iiZQLQPCLiJ3M4MrwFCByUBb2qNnTEBaDbhH34aKbLkW
 49 |           QBZuXSyNZPigZc1nwIrQKoSCVK/E6Ak5gXVv7p6Cqiraoj9juIuk8c3DnTTyqT1fC/hke4CD820C
 50 |           EkrvYtM5qtoGfUo2oDFUog2wQbIlwyaS0QzydCsei8iyS8ZGYw74y3HNxpWNdxs+8Ee8IEtc5R4l
 51 |           O9ut1KAtQyV6/mUC8KsPNP6RkWi8q5uQB7dF20lm80FQjGc0kheXBzK4IM2IX14n76jlGoMkwycH
 52 |           IZRUFeqxc7weGTW5E2JyMvXfZt7THiYnW/6P/EgohU1AnTce9ZD8e2Ueu5/sX2XHHfeGBaPfk8I8
 53 |           EPouCY2FjGY4fcEtB6zzgmyJvvE03H/R5MsZ6qXcXCyUmLxMXgEAAP//AwCu/+jJDQQAAA==
 54 |       headers:
 55 |         CF-Cache-Status:
 56 |           - DYNAMIC
 57 |         CF-RAY:
 58 |           - 910ad9d41ce87ab2-SJC
 59 |         Connection:
 60 |           - keep-alive
 61 |         Content-Encoding:
 62 |           - gzip
 63 |         Content-Type:
 64 |           - application/json
 65 |         Date:
 66 |           - Wed, 12 Feb 2025 07:26:32 GMT
 67 |         Server:
 68 |           - cloudflare
 69 |         Set-Cookie:
 70 |           - __cf_bm=wgGARbubXUu4RCa7O7vqQbGRDDz7T2S6.0lDcAZaWZg-1739345192-1.0.1.1-gi4_gPOvtYOcQgL_U._xS5wMuwepL3zIP3VenwWVZZffP8ANs3vyVFM07I38bKIOXgSi83Bq4Ed8ZUwobaVejA;
 71 |             path=/; expires=Wed, 12-Feb-25 07:56:32 GMT; domain=.api.openai.com; HttpOnly;
 72 |             Secure; SameSite=None
 73 |           - _cfuvid=h0OafY1hscLy_jhACoWa4TkXDoRejaRg0hf_tOisUEU-1739345192160-0.0.1.1-604800000;
 74 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 75 |         Transfer-Encoding:
 76 |           - chunked
 77 |         X-Content-Type-Options:
 78 |           - nosniff
 79 |         access-control-expose-headers:
 80 |           - X-Request-ID
 81 |         alt-svc:
 82 |           - h3=":443"; ma=86400
 83 |         openai-organization:
 84 |           - future-house-xr4tdh
 85 |         openai-processing-ms:
 86 |           - "997"
 87 |         openai-version:
 88 |           - "2020-10-01"
 89 |         strict-transport-security:
 90 |           - max-age=31536000; includeSubDomains; preload
 91 |         x-ratelimit-limit-requests:
 92 |           - "30000"
 93 |         x-ratelimit-limit-tokens:
 94 |           - "150000000"
 95 |         x-ratelimit-remaining-requests:
 96 |           - "29999"
 97 |         x-ratelimit-remaining-tokens:
 98 |           - "149999937"
 99 |         x-ratelimit-reset-requests:
100 |           - 2ms
101 |         x-ratelimit-reset-tokens:
102 |           - 0s
103 |         x-request-id:
104 |           - req_0311ae3de81850199f4bfe95ab85a1e2
105 |       status:
106 |         code: 200
107 |         message: OK
108 | version: 1
109 | 


--------------------------------------------------------------------------------
/packages/lmi/tests/conftest.py:
--------------------------------------------------------------------------------
 1 | from __future__ import annotations
 2 | 
 3 | import logging
 4 | import shutil
 5 | from collections.abc import Iterator
 6 | from pathlib import Path
 7 | from typing import Any
 8 | 
 9 | import pytest
10 | from dotenv import load_dotenv
11 | 
12 | from lmi.utils import (
13 |     ANTHROPIC_API_KEY_HEADER,
14 |     CROSSREF_KEY_HEADER,
15 |     OPENAI_API_KEY_HEADER,
16 |     SEMANTIC_SCHOLAR_KEY_HEADER,
17 |     filter_api_keys,
18 | )
19 | 
20 | TESTS_DIR = Path(__file__).parent
21 | CASSETTES_DIR = TESTS_DIR / "cassettes"
22 | 
23 | 
24 | @pytest.fixture(autouse=True, scope="session")
25 | def _load_env() -> None:
26 |     load_dotenv()
27 | 
28 | 
29 | @pytest.fixture(scope="session", name="vcr_config")
30 | def fixture_vcr_config() -> dict[str, Any]:
31 |     return {
32 |         "filter_headers": [
33 |             CROSSREF_KEY_HEADER,
34 |             SEMANTIC_SCHOLAR_KEY_HEADER,
35 |             OPENAI_API_KEY_HEADER,
36 |             ANTHROPIC_API_KEY_HEADER,
37 |             "cookie",
38 |         ],
39 |         "before_record_request": filter_api_keys,
40 |         "record_mode": "once",
41 |         "allow_playback_repeats": True,
42 |         "cassette_library_dir": str(CASSETTES_DIR),
43 |     }
44 | 
45 | 
46 | @pytest.fixture
47 | def tmp_path_cleanup(tmp_path: Path) -> Iterator[Path]:
48 |     yield tmp_path
49 |     # Cleanup after the test
50 |     if tmp_path.exists():
51 |         shutil.rmtree(tmp_path, ignore_errors=True)
52 | 
53 | 
54 | @pytest.fixture(scope="session", name="stub_data_dir")
55 | def fixture_stub_data_dir() -> Path:
56 |     return Path(__file__).parent / "stub_data"
57 | 
58 | 
59 | @pytest.fixture(name="reset_log_levels")
60 | def fixture_reset_log_levels(caplog) -> Iterator[None]:
61 |     logging.getLogger().setLevel(logging.DEBUG)
62 | 
63 |     for name in logging.root.manager.loggerDict:
64 |         logger = logging.getLogger(name)
65 |         logger.setLevel(logging.DEBUG)
66 |         logger.propagate = True
67 | 
68 |     caplog.set_level(logging.DEBUG)
69 | 
70 |     yield
71 | 
72 |     for name in logging.root.manager.loggerDict:
73 |         logger = logging.getLogger(name)
74 |         logger.setLevel(logging.NOTSET)
75 |         logger.propagate = True
76 | 


--------------------------------------------------------------------------------
/src/ldp/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Future-House/ldp/2e9557233dc0e4c8abbb9f1f065059108a0dcfcd/src/ldp/__init__.py


--------------------------------------------------------------------------------
/src/ldp/agent/__init__.py:
--------------------------------------------------------------------------------
 1 | # Lower than LiteLLM's 10-min default: https://github.com/BerriAI/litellm/blob/v1.48.10/litellm/main.py#L859
 2 | DEFAULT_LLM_COMPLETION_TIMEOUT = 120  # seconds
 3 | 
 4 | # ruff: noqa: E402  # Avoid circular imports
 5 | 
 6 | from .agent import Agent, AgentConfig
 7 | from .agent_client import HTTPAgentClient, make_simple_agent_server
 8 | from .memory_agent import MemoryAgent
 9 | from .react_agent import ReActAgent
10 | from .simple_agent import NoToolsSimpleAgent, SimpleAgent, SimpleAgentState
11 | from .tree_of_thoughts_agent import TreeofThoughtsAgent
12 | 
13 | __all__ = [
14 |     "DEFAULT_LLM_COMPLETION_TIMEOUT",
15 |     "Agent",
16 |     "AgentConfig",
17 |     "HTTPAgentClient",
18 |     "MemoryAgent",
19 |     "NoToolsSimpleAgent",
20 |     "ReActAgent",
21 |     "SimpleAgent",
22 |     "SimpleAgentState",
23 |     "TreeofThoughtsAgent",
24 |     "make_simple_agent_server",
25 | ]
26 | 


--------------------------------------------------------------------------------
/src/ldp/alg/__init__.py:
--------------------------------------------------------------------------------
 1 | from .algorithms import (
 2 |     bulk_evaluate_consensus,
 3 |     compute_pass_at_k,
 4 |     evaluate_consensus,
 5 |     to_network,
 6 | )
 7 | from .beam_search import Beam, BeamSearchRollout
 8 | from .callbacks import (
 9 |     Callback,
10 |     ClearContextCallback,
11 |     ClearOptimizerBuffersCallback,
12 |     ComputeTrajectoryMetricsMixin,
13 |     LoggingCallback,
14 |     MeanMetricsCallback,
15 |     RolloutDebugDumpCallback,
16 |     StoreTrajectoriesCallback,
17 |     TrajectoryFileCallback,
18 |     TrajectoryMetricsCallback,
19 |     WandBLoggingCallback,
20 | )
21 | from .rollout import RolloutManager
22 | from .runners import (
23 |     Evaluator,
24 |     EvaluatorConfig,
25 |     OfflineTrainer,
26 |     OfflineTrainerConfig,
27 |     OnlineTrainer,
28 |     OnlineTrainerConfig,
29 | )
30 | from .tree_search import TEnvCloneFn, TreeSearchRollout
31 | 
32 | __all__ = [
33 |     "Beam",
34 |     "BeamSearchRollout",
35 |     "Callback",
36 |     "ClearContextCallback",
37 |     "ClearOptimizerBuffersCallback",
38 |     "ComputeTrajectoryMetricsMixin",
39 |     "Evaluator",
40 |     "EvaluatorConfig",
41 |     "LoggingCallback",
42 |     "MeanMetricsCallback",
43 |     "OfflineTrainer",
44 |     "OfflineTrainerConfig",
45 |     "OnlineTrainer",
46 |     "OnlineTrainerConfig",
47 |     "RolloutDebugDumpCallback",
48 |     "RolloutManager",
49 |     "StoreTrajectoriesCallback",
50 |     "TEnvCloneFn",
51 |     "TrajectoryFileCallback",
52 |     "TrajectoryMetricsCallback",
53 |     "TreeSearchRollout",
54 |     "WandBLoggingCallback",
55 |     "bulk_evaluate_consensus",
56 |     "compute_pass_at_k",
57 |     "evaluate_consensus",
58 |     "to_network",
59 | ]
60 | 


--------------------------------------------------------------------------------
/src/ldp/alg/datasets.py:
--------------------------------------------------------------------------------
 1 | from aviary.core import TASK_DATASET_REGISTRY
 2 | from aviary.core import DummyTaskDataset as _DummyTaskDataset
 3 | 
 4 | from .callbacks import ComputeTrajectoryMetricsMixin
 5 | 
 6 | 
 7 | class DummyTaskDataset(_DummyTaskDataset, ComputeTrajectoryMetricsMixin):
 8 |     pass
 9 | 
10 | 
11 | TASK_DATASET_REGISTRY["dummy"] = "ldp.alg.datasets", "DummyTaskDataset"
12 | 


--------------------------------------------------------------------------------
/src/ldp/alg/optimizer/__init__.py:
--------------------------------------------------------------------------------
 1 | from typing import Any, cast
 2 | 
 3 | from pydantic import BaseModel, ConfigDict, Field
 4 | 
 5 | from ldp.agent import Agent, MemoryAgent, ReActAgent
 6 | from ldp.alg.optimizer.ape import APEOpt, APEScoreFn
 7 | from ldp.alg.optimizer.memory import MemoryFactory, MemoryOpt, PositiveMemoryOpt
 8 | from ldp.alg.optimizer.opt import _OPTIMIZER_REGISTRY, ChainedOptimizer, Optimizer
 9 | 
10 | _DEFAULT_OPTIMIZER_ERROR_MSG = (
11 |     "Didn't yet implement an optimizer of type {opt_type} for {agent_type}."
12 | )
13 | AUTOSELECT_BEST_OPTIMIZER = None
14 | 
15 | 
16 | class OptimizerConfig(BaseModel):
17 |     model_config = ConfigDict(extra="forbid")
18 | 
19 |     optimizer_type: str | None = AUTOSELECT_BEST_OPTIMIZER
20 |     optimizer_kwargs: dict[str, Any] = Field(default_factory=dict)
21 | 
22 | 
23 | _DEFAULT_OPTIMIZER_MAP: dict[type[Agent], type[Optimizer]] = {
24 |     MemoryAgent: MemoryOpt,
25 |     ReActAgent: APEOpt,
26 | }
27 | 
28 | 
29 | def default_optimizer_factory(
30 |     agent: Agent,
31 |     optimizer_cls: str | type[Optimizer] | None = AUTOSELECT_BEST_OPTIMIZER,
32 |     **optimizer_kwargs,
33 | ) -> Optimizer:
34 |     """A method that constructs a default optimizer for commonly-used agents.
35 | 
36 |     Args:
37 |         agent: Agent to construct the optimizer for.
38 |         optimizer_cls: The optimizer class to use. If not specified, we will try a
39 |             default based on the provided agent.
40 |         optimizer_kwargs: Arguments forwarded to optimizer_cls.
41 | 
42 |     Returns:
43 |         Instantiated optimizer.
44 |     """
45 |     if isinstance(optimizer_cls, str):
46 |         try:
47 |             optimizer_cls = _OPTIMIZER_REGISTRY[optimizer_cls]
48 |         except KeyError:
49 |             raise TypeError(
50 |                 "Optimizer class not supported by default_optimizer_factory:"
51 |                 f" {optimizer_cls}"
52 |             ) from None
53 | 
54 |     if optimizer_cls is None:
55 |         optimizer_cls = _DEFAULT_OPTIMIZER_MAP.get(agent.__class__)
56 | 
57 |     # convince mypy that optimizer_cls is a type from here on
58 |     optimizer_cls = cast("type", optimizer_cls)
59 | 
60 |     if isinstance(agent, MemoryAgent):
61 |         if optimizer_cls != MemoryOpt:
62 |             raise NotImplementedError(
63 |                 _DEFAULT_OPTIMIZER_ERROR_MSG.format(
64 |                     opt_type=optimizer_cls.__name__, agent_type=MemoryAgent.__name__
65 |                 )
66 |             )
67 |         return MemoryOpt.from_agent(agent, **optimizer_kwargs)
68 |     if isinstance(agent, ReActAgent):
69 |         if optimizer_cls != APEOpt:
70 |             raise NotImplementedError(
71 |                 _DEFAULT_OPTIMIZER_ERROR_MSG.format(
72 |                     opt_type=optimizer_cls.__name__, agent_type=ReActAgent.__name__
73 |                 )
74 |             )
75 |         return APEOpt.from_agent(agent, **optimizer_kwargs)
76 |     raise TypeError(f"Unsupported agent type: {agent.__class__.__name__}")
77 | 
78 | 
79 | __all__ = [
80 |     "APEOpt",
81 |     "APEScoreFn",
82 |     "ChainedOptimizer",
83 |     "MemoryFactory",
84 |     "MemoryOpt",
85 |     "Optimizer",
86 |     "OptimizerConfig",
87 |     "PositiveMemoryOpt",
88 |     "default_optimizer_factory",
89 | ]
90 | 


--------------------------------------------------------------------------------
/src/ldp/alg/optimizer/opt.py:
--------------------------------------------------------------------------------
 1 | from __future__ import annotations
 2 | 
 3 | import logging
 4 | from abc import ABC, abstractmethod
 5 | from collections.abc import Iterable
 6 | 
 7 | from ldp.data_structures import Trajectory
 8 | from ldp.shims import tqdm
 9 | 
10 | logger = logging.getLogger(__name__)
11 | 
12 | 
13 | # Registry for all optimizers
14 | _OPTIMIZER_REGISTRY: dict[str, type[Optimizer]] = {}
15 | 
16 | 
17 | class Optimizer(ABC):
18 |     """Base class for all optimizers."""
19 | 
20 |     def __init_subclass__(cls) -> None:
21 |         # Register each optimizer subclass
22 |         _OPTIMIZER_REGISTRY[cls.__name__] = cls
23 |         return super().__init_subclass__()
24 | 
25 |     def aggregate(
26 |         self, trajectories: Iterable[Trajectory], show_pbar: bool = False, **kwargs
27 |     ) -> None:
28 |         """Aggregate trajectories to construct training samples."""
29 |         trajectories_with_pbar = tqdm(
30 |             trajectories,
31 |             desc="Aggregating trajectories",
32 |             ncols=0,
33 |             mininterval=1,
34 |             disable=not show_pbar,
35 |         )
36 |         for trajectory in trajectories_with_pbar:
37 |             self.aggregate_trajectory(trajectory, **kwargs)
38 | 
39 |     @abstractmethod
40 |     def aggregate_trajectory(self, trajectory: Trajectory) -> None:
41 |         """Aggregate transitions from a single trajectory to construct training samples."""
42 | 
43 |     @abstractmethod
44 |     async def update(self) -> None:
45 |         """Update the model based on the aggregated samples."""
46 | 
47 | 
48 | class ChainedOptimizer(Optimizer):
49 |     """An optimizer that runs a sequence of sub-optimizers in the order they are provided."""
50 | 
51 |     def __init__(self, *optimizers: Optimizer):
52 |         self.optimizers = optimizers
53 | 
54 |     def aggregate(
55 |         self, trajectories: Iterable[Trajectory], show_pbar: bool = False, **kwargs
56 |     ) -> None:
57 |         for optimizer in self.optimizers:
58 |             optimizer.aggregate(trajectories, show_pbar=show_pbar, **kwargs)
59 | 
60 |     async def update(self) -> None:
61 |         for optimizer in self.optimizers:
62 |             await optimizer.update()
63 | 


--------------------------------------------------------------------------------
/src/ldp/graph/__init__.py:
--------------------------------------------------------------------------------
 1 | from .common_ops import (
 2 |     ConfigOp,
 3 |     EmbeddingOp,
 4 |     FxnOp,
 5 |     IdentityOp,
 6 |     LLMCallOp,
 7 |     MemoryOp,
 8 |     PromptOp,
 9 | )
10 | from .loss_ops import MSELossOp
11 | from .memory import Memory, MemoryModel
12 | from .op_utils import (
13 |     CallID,
14 |     compute_graph,
15 |     eval_mode,
16 |     get_call_id,
17 |     get_run_id,
18 |     get_training_mode,
19 |     op_call,
20 |     set_training_mode,
21 |     train_mode,
22 | )
23 | from .ops import Op, OpCtx, OpResult
24 | 
25 | __all__ = [
26 |     "CallID",
27 |     "ConfigOp",
28 |     "EmbeddingOp",
29 |     "FxnOp",
30 |     "IdentityOp",
31 |     "LLMCallOp",
32 |     "MSELossOp",
33 |     "Memory",
34 |     "MemoryModel",
35 |     "MemoryOp",
36 |     "Op",
37 |     "OpCtx",
38 |     "OpResult",
39 |     "PromptOp",
40 |     "compute_graph",
41 |     "eval_mode",
42 |     "get_call_id",
43 |     "get_run_id",
44 |     "get_training_mode",
45 |     "op_call",
46 |     "set_training_mode",
47 |     "train_mode",
48 | ]
49 | 


--------------------------------------------------------------------------------
/src/ldp/graph/loss_ops.py:
--------------------------------------------------------------------------------
 1 | """This module contains loss Op implementations."""
 2 | 
 3 | from typing import TYPE_CHECKING
 4 | 
 5 | from .op_utils import CallID
 6 | from .ops import GradInType, Op, OpCtx
 7 | 
 8 | if TYPE_CHECKING:
 9 |     import numpy.typing as npt
10 |     import torch
11 |     import tree
12 | 
13 | 
14 | class MSELossOp(Op):
15 |     async def forward(
16 |         self,
17 |         prediction: "npt.NDArray | torch.Tensor",
18 |         target: "npt.NDArray | torch.Tensor",
19 |     ) -> "float | torch.Tensor":
20 |         return ((prediction - target) ** 2).mean()
21 | 
22 |     @classmethod
23 |     def backward(
24 |         cls,
25 |         ctx: OpCtx,
26 |         input_args,
27 |         input_kwargs,
28 |         grad_output: "tree.Structure",
29 |         call_id: CallID,
30 |     ) -> GradInType:
31 |         prediction = input_kwargs["prediction"]
32 |         target = input_kwargs["target"]
33 |         grad = 2 * (prediction - target)
34 |         return [], {"prediction": grad, "target": None}
35 | 


--------------------------------------------------------------------------------
/src/ldp/graph/modules/__init__.py:
--------------------------------------------------------------------------------
 1 | """
 2 | A module is a subgraph of a compute graph that can be exposed like a single node/op.
 3 | 
 4 | An analogous entity in PyTorch is torch.nn.Module.
 5 | """
 6 | 
 7 | from .llm_call import ParsedLLMCallModule
 8 | from .react import (
 9 |     ReActModule,
10 |     ReActModuleSinglePrompt,
11 |     ToolDescriptionMethods,
12 |     parse_message,
13 | )
14 | from .reflect import ReflectModule, ReflectModuleConfig
15 | from .thought import ThoughtModule
16 | 
17 | __all__ = [
18 |     "ParsedLLMCallModule",
19 |     "ReActModule",
20 |     "ReActModuleSinglePrompt",
21 |     "ReflectModule",
22 |     "ReflectModuleConfig",
23 |     "ThoughtModule",
24 |     "ToolDescriptionMethods",
25 |     "parse_message",
26 | ]
27 | 


--------------------------------------------------------------------------------
/src/ldp/graph/modules/llm_call.py:
--------------------------------------------------------------------------------
 1 | from collections.abc import Callable, Iterable
 2 | from typing import Any, Generic, TypeVar
 3 | 
 4 | from aviary.core import Message
 5 | 
 6 | from ldp.graph import ConfigOp, FxnOp, LLMCallOp, OpResult, compute_graph
 7 | 
 8 | TParsedMessage = TypeVar("TParsedMessage", bound=Message)
 9 | 
10 | 
11 | class ParsedLLMCallModule(Generic[TParsedMessage]):
12 |     """Module for a processing-based tool selection, with a learnable configuration."""
13 | 
14 |     def __init__(
15 |         self, llm_model: dict[str, Any], parser: Callable[..., TParsedMessage]
16 |     ):
17 |         self.config_op = ConfigOp[dict](config=llm_model)
18 |         self.llm_call_op = LLMCallOp()
19 |         self.parse_msg_op = FxnOp(parser)
20 | 
21 |     @compute_graph()
22 |     async def __call__(
23 |         self, messages: Iterable[Message], *parse_args, **parse_kwargs
24 |     ) -> tuple[OpResult[TParsedMessage], Message]:
25 |         raw_result = await self.llm_call_op(await self.config_op(), msgs=messages)
26 |         return (
27 |             await self.parse_msg_op(raw_result, *parse_args, **parse_kwargs),
28 |             raw_result.value,
29 |         )
30 | 


--------------------------------------------------------------------------------
/src/ldp/graph/modules/reflect.py:
--------------------------------------------------------------------------------
 1 | from typing import Any
 2 | 
 3 | from aviary.core import Message
 4 | from pydantic import BaseModel, Field
 5 | 
 6 | from ldp.graph import ConfigOp, FxnOp, LLMCallOp, PromptOp, compute_graph
 7 | from ldp.graph.ops import ResultOrValue
 8 | from ldp.llms import append_to_sys, indent_xml
 9 | 
10 | 
11 | class ReflectModuleConfig(BaseModel):
12 |     """Configuration for the ReflectModuleConfig."""
13 | 
14 |     llm_model: dict[str, Any] = Field(
15 |         default={"name": "gpt-3.5-turbo"},
16 |         description="Starting configuration for the LLM model.",
17 |     )
18 | 
19 | 
20 | class ReflectModule:
21 |     """A module that simply gives an LLM to reflect on an input."""
22 | 
23 |     def __init__(self, start_config: ReflectModuleConfig):
24 |         self.llm_call_op = LLMCallOp()
25 |         self.prompt_op = PromptOp(
26 |             "Consider a proposed response based on context. Reflect on the response"
27 |             " within <thought> tags then conclude with a possibly revised response"
28 |             " within <final-response> tags."
29 |         )
30 |         self.config_op = ConfigOp[ReflectModuleConfig](config=start_config)
31 |         self.llm_config_op = FxnOp[dict](lambda c: c.llm_model)
32 |         self.package_fxn = FxnOp(append_to_sys)
33 | 
34 |         def extract_msg(msg: Message, backup_response: str) -> str:
35 |             msg_str = msg.content
36 |             if msg_str and "<final-response>" in msg_str:
37 |                 return msg_str.split("<final-response>")[1].split("</final-response>")[
38 |                     0
39 |                 ]
40 |             if msg_str and "<response>" in msg_str:
41 |                 return msg_str.split("<response>")[1].split("</response>")[0]
42 |             return backup_response
43 | 
44 |         self.extract_msg = FxnOp(extract_msg)
45 | 
46 |     @compute_graph()
47 |     async def __call__(
48 |         self, context: ResultOrValue[str], response: ResultOrValue[str]
49 |     ) -> ResultOrValue[str]:
50 |         llm_config = await self.llm_config_op(await self.config_op())
51 |         sys_str = await self.prompt_op()
52 |         user_str = indent_xml(
53 |             f"<context>{context}</context><response>{response}</response>"
54 |         )
55 |         msg = await self.package_fxn(user_str, sys_str)
56 |         llm_result = await self.llm_call_op(llm_config, msg)
57 |         return await self.extract_msg(llm_result, response)
58 | 


--------------------------------------------------------------------------------
/src/ldp/graph/modules/thought.py:
--------------------------------------------------------------------------------
 1 | from collections.abc import Iterable, Mapping
 2 | from typing import Any
 3 | 
 4 | from aviary.core import Message, ToolRequestMessage
 5 | 
 6 | from ldp.graph import FxnOp, OpResult, PromptOp, compute_graph
 7 | from ldp.llms import prepend_sys_and_append_sys
 8 | 
 9 | from .llm_call import ParsedLLMCallModule
10 | 
11 | 
12 | class ThoughtModule:
13 |     @staticmethod
14 |     def _downcast_to_message(message: Message | ToolRequestMessage) -> Message:
15 |         if isinstance(message, ToolRequestMessage):
16 |             # Downcast into a normal Message if the LLM tried to call tools
17 |             return Message(role=message.role, content=message.content)
18 |         return message
19 | 
20 |     def __init__(
21 |         self, llm_model: dict[str, Any], first_sys_prompt: str, second_sys_prompt: str
22 |     ):
23 |         self.first_sys_prompt_op = PromptOp(first_sys_prompt)
24 |         self.second_sys_prompt_op = PromptOp(second_sys_prompt)
25 |         self.package_msg_op = FxnOp(prepend_sys_and_append_sys)
26 |         self.llm_call = ParsedLLMCallModule[Message](
27 |             llm_model, parser=self._downcast_to_message
28 |         )
29 | 
30 |     @compute_graph()
31 |     async def __call__(
32 |         self,
33 |         messages: Iterable[Message],
34 |         first_prompt_kwargs: Mapping[str, Any],
35 |         second_prompt_kwargs: Mapping[str, Any],
36 |     ) -> OpResult[Message]:
37 |         packaged_msgs = await self.package_msg_op(
38 |             messages,
39 |             initial_sys_content=await self.first_sys_prompt_op(**first_prompt_kwargs),
40 |             final_sys_content=await self.second_sys_prompt_op(**second_prompt_kwargs),
41 |         )
42 |         return (await self.llm_call(packaged_msgs))[0]  # type: ignore[arg-type]
43 | 


--------------------------------------------------------------------------------
/src/ldp/llms/__init__.py:
--------------------------------------------------------------------------------
 1 | from lmi import LiteLLMModel as LLMModel
 2 | from lmi import (
 3 |     LLMResult,
 4 |     sum_logprobs,
 5 |     validate_json_completion,
 6 | )
 7 | from lmi.embeddings import (
 8 |     EmbeddingModel,
 9 |     EmbeddingModes,
10 |     HybridEmbeddingModel,
11 |     LiteLLMEmbeddingModel,
12 |     SparseEmbeddingModel,
13 | )
14 | from lmi.exceptions import (
15 |     JSONSchemaValidationError,
16 | )
17 | 
18 | from .prompts import (
19 |     append_to_messages,
20 |     append_to_sys,
21 |     indent_xml,
22 |     prepend_sys,
23 |     prepend_sys_and_append_sys,
24 | )
25 | 
26 | __all__ = [
27 |     "EmbeddingModel",
28 |     "EmbeddingModes",
29 |     "HybridEmbeddingModel",
30 |     "JSONSchemaValidationError",
31 |     "LLMModel",
32 |     "LLMResult",
33 |     "LiteLLMEmbeddingModel",
34 |     "SparseEmbeddingModel",
35 |     "append_to_messages",
36 |     "append_to_sys",
37 |     "indent_xml",
38 |     "prepend_sys",
39 |     "prepend_sys_and_append_sys",
40 |     "sum_logprobs",
41 |     "validate_json_completion",
42 | ]
43 | 


--------------------------------------------------------------------------------
/src/ldp/llms/prompts.py:
--------------------------------------------------------------------------------
  1 | """This module provides utility functions for appending and prepending system messages."""
  2 | 
  3 | from collections.abc import Collection, Iterable
  4 | 
  5 | from aviary.core import Message
  6 | 
  7 | 
  8 | def append_to_messages(messages: list[Message], new_message: Message) -> list[Message]:
  9 |     """Appends a message to a list of messages, returning that in-place modified list.
 10 | 
 11 |     Examples:
 12 |         >>> messages = [Message(content="Hello")]
 13 |         >>> modified_messages = append_to_messages(messages, Message(content="New"))
 14 |         >>> modified_messages
 15 |         [Message(role='user', content='Hello'), Message(role='user', content='New')]
 16 |         >>> id(messages) == id(modified_messages)
 17 |         True
 18 |     """
 19 |     messages.append(new_message)
 20 |     return messages
 21 | 
 22 | 
 23 | def append_to_sys(user_content: str, sys_content: str | None = None) -> list[Message]:
 24 |     """Appends a user message to a list of messages, optionally including a system message.
 25 | 
 26 |     Args:
 27 |         user_content: The content of the user message.
 28 |         sys_content: Optional content for the system message. Defaults to None.
 29 | 
 30 |     Returns:
 31 |         A list of messages including the optional system message and the user message.
 32 | 
 33 |     Examples:
 34 |         >>> append_to_sys("Hello, world!")
 35 |         [Message(role='user', content='Hello, world!')]
 36 | 
 37 |         >>> append_to_sys("Hello, world!", "System initialized.")
 38 |         [Message(role='system', content='System initialized.'), Message(role='user', content='Hello, world!')]
 39 |     """
 40 |     sys = [Message(role="system", content=sys_content)] if sys_content else []
 41 |     return [*sys, Message(content=user_content)]
 42 | 
 43 | 
 44 | def prepend_sys(messages: Collection, sys_content: str) -> list[Message]:
 45 |     """Prepends a system message to a list of messages.
 46 | 
 47 |     Args:
 48 |         messages: The list of existing messages.
 49 |         sys_content: The content of the system message to be prepended.
 50 | 
 51 |     Returns:
 52 |         A new list of messages with the system message prepended.
 53 | 
 54 |     Examples:
 55 |         >>> messages = [Message(role="user", content="Hello!")]
 56 |         >>> prepend_sys(messages, "System initialized.")
 57 |         [Message(role='system', content='System initialized.'), Message(role='user', content='Hello!')]
 58 |     """
 59 |     return [Message(role="system", content=sys_content), *messages]
 60 | 
 61 | 
 62 | def indent_xml(xml_string, indent_size=2):
 63 |     output = []
 64 |     indent_level = 0
 65 | 
 66 |     # Split the input XML into parts by tags
 67 |     parts = xml_string.replace(">", ">\n").replace("<", "\n<").split("\n")
 68 |     parts = [part for part in parts if part.strip()]  # Remove empty parts
 69 | 
 70 |     for part in parts:
 71 |         if part.startswith("</"):
 72 |             # Closing tag, decrease indent
 73 |             indent_level -= indent_size
 74 |             output.append(" " * indent_level + part)
 75 |         elif part.startswith("<") and not part.endswith("/>") and ">" in part:
 76 |             # Opening tag, maintain then increase indent
 77 |             output.append(" " * indent_level + part)
 78 |             indent_level += indent_size
 79 |         elif part.endswith("/>"):
 80 |             # Self-closing tag, just append
 81 |             output.append(" " * indent_level + part)
 82 |         else:
 83 |             # Text or other data, maintain current indent
 84 |             # Handle multiple lines within text nodes
 85 |             text_lines = part.split("\n")
 86 |             output.extend([
 87 |                 " " * indent_level + line.strip() for line in text_lines if line.strip()
 88 |             ])
 89 | 
 90 |     return "\n".join(output)
 91 | 
 92 | 
 93 | def prepend_sys_and_append_sys(
 94 |     messages: Iterable[Message], initial_sys_content: str, final_sys_content: str
 95 | ) -> list[Message]:
 96 |     return [
 97 |         Message(role="system", content=initial_sys_content),
 98 |         *messages,
 99 |         Message(role="system", content=final_sys_content),
100 |     ]
101 | 


--------------------------------------------------------------------------------
/src/ldp/main.py:
--------------------------------------------------------------------------------
 1 | import argparse
 2 | import asyncio
 3 | import pickle
 4 | from contextlib import suppress
 5 | from os import PathLike
 6 | from pathlib import Path
 7 | 
 8 | from aviary.core import Environment
 9 | 
10 | from ldp.agent import Agent
11 | from ldp.alg.callbacks import TerminalPrintingCallback
12 | from ldp.alg.rollout import RolloutManager
13 | 
14 | 
15 | def get_or_make_agent(agent: Agent | str | PathLike) -> Agent:
16 |     if isinstance(agent, Agent):
17 |         return agent
18 | 
19 |     if isinstance(agent, str):
20 |         with suppress(KeyError):
21 |             return Agent.from_name(agent)
22 | 
23 |     path = Path(agent)
24 |     if not path.exists():
25 |         raise ValueError(f"Could not resolve agent: {agent}")
26 | 
27 |     with path.open("rb") as f:
28 |         return pickle.load(f)  # noqa: S301
29 | 
30 | 
31 | def get_or_make_environment(environment: Environment | str, task: str) -> Environment:
32 |     if isinstance(environment, Environment):
33 |         return environment
34 | 
35 |     if isinstance(environment, str):
36 |         with suppress(KeyError):
37 |             return Environment.from_name(environment, task=task)
38 | 
39 |     raise ValueError(
40 |         f"Could not resolve environment: {environment}. Available environments:"
41 |         f" {Environment.available()}"
42 |     )
43 | 
44 | 
45 | async def main(
46 |     task: str,
47 |     environment: Environment | str,
48 |     agent: Agent | str | PathLike = "SimpleAgent",
49 | ):
50 |     agent = get_or_make_agent(agent)
51 | 
52 |     callback = TerminalPrintingCallback()
53 |     rollout_manager = RolloutManager(agent=agent, callbacks=[callback])
54 | 
55 |     _ = await rollout_manager.sample_trajectories(
56 |         environment_factory=lambda: get_or_make_environment(environment, task)
57 |     )
58 | 
59 | 
60 | if __name__ == "__main__":
61 |     parser = argparse.ArgumentParser()
62 |     parser.add_argument("task", help="Task to prompt environment with.")
63 |     parser.add_argument(
64 |         "--env", required=True, help="Environment to sample trajectories from."
65 |     )
66 |     parser.add_argument(
67 |         "--agent", default="SimpleAgent", help="Agent to sample trajectories with."
68 |     )
69 |     args = parser.parse_args()
70 | 
71 |     asyncio.run(main(args.task, args.env, args.agent))
72 | 


--------------------------------------------------------------------------------
/src/ldp/nn/__init__.py:
--------------------------------------------------------------------------------
 1 | from ldp.nn.handlers.chunking import TensorChunker
 2 | 
 3 | from .agent.simple_local_agent import AgentLMConfig, SimpleLocalLLMAgent
 4 | from .graph.llm_call_op import LocalLLMCallOp
 5 | from .handlers.transformer_handler import (
 6 |     AsyncTransformer,
 7 |     AsyncTransformerInterface,
 8 |     ExecutionMode,
 9 |     LMType,
10 |     ParallelAsyncTransformer,
11 |     ParallelModeConfig,
12 |     ParallelTransformerHandler,
13 |     TransformerHandler,
14 |     TransformerHandlerConfig,
15 |     collate_fn_transformer_left_pad,
16 |     collate_fn_transformer_right_pad,
17 |     decollate_fn_transformer_decoder,
18 | )
19 | from .lm_config import LMConfig, TorchDType
20 | from .utils import set_seed
21 | 
22 | __all__ = [
23 |     "AgentLMConfig",
24 |     "AsyncTransformer",
25 |     "AsyncTransformerInterface",
26 |     "ExecutionMode",
27 |     "LMConfig",
28 |     "LMType",
29 |     "LocalLLMCallOp",
30 |     "ParallelAsyncTransformer",
31 |     "ParallelModeConfig",
32 |     "ParallelTransformerHandler",
33 |     "SimpleLocalLLMAgent",
34 |     "TensorChunker",
35 |     "TorchDType",
36 |     "TransformerHandler",
37 |     "TransformerHandlerConfig",
38 |     "collate_fn_transformer_left_pad",
39 |     "collate_fn_transformer_right_pad",
40 |     "decollate_fn_transformer_decoder",
41 |     "set_seed",
42 | ]
43 | 


--------------------------------------------------------------------------------
/src/ldp/nn/chat_templates/README.md:
--------------------------------------------------------------------------------
1 | - llama3.1_chat_template_vllm.jinja: https://github.com/vllm-project/vllm/blob/4fb8e329fd6f51d576bcf4b7e8907e0d83c4b5cf/examples/tool_chat_template_llama3.1_json.jinja
2 | - llama3.1_chat_template_hf.jinja: https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct/blob/main/tokenizer_config.json#L2053
3 | - llama3.1_chat_template_thought.jinja: Fixes a typo in llama3.1_chat_template_ori.jinja
4 | - llama3.1_chat_template_nothought.jinja: Derived from llama3.1_chat_template_ori.jinja, but removes thoughts
5 | - llama\*ori.jinja: TODOC - these were written by @kwanUm
6 | 


--------------------------------------------------------------------------------
/src/ldp/nn/chat_templates/llama2_chat_template_ori.jinja:
--------------------------------------------------------------------------------
 1 | {% if messages[0]['role'] == 'system' %}
 2 |     {% set loop_messages = messages[1:] %}
 3 |     {% set system_message = messages[0]['content'] %}
 4 | {% else %}
 5 |     {% set loop_messages = messages %}
 6 |     {% set system_message = false %}
 7 | {% endif %}
 8 | {% for message in loop_messages %}
 9 |     {% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}
10 |         {{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}
11 |     {% endif %}
12 |     {% if loop.index0 == 0 and system_message != false %}
13 |         {% set content = '<<SYS>>\\n' + system_message + '\\n<</SYS>>\\n\\n' + message['content'] %}
14 |     {% else %}
15 |         {% set content = message['content'] %}
16 |     {% endif %}
17 |     {% if message['role'] == 'user' %}
18 |         {{ bos_token + '[INST] ' + content.strip() + ' [/INST]' }}
19 |     {% elif message['role'] == 'assistant' %}
20 |         {% generation %}{{ ' '  + content.strip() + ' ' + eos_token }}{% endgeneration %}
21 |     {% endif %}
22 | {% endfor %}
23 | 


--------------------------------------------------------------------------------
/src/ldp/nn/generation/__init__.py:
--------------------------------------------------------------------------------
1 | from .base import LogitsProcessorWithFinalize
2 | 
3 | __all__ = [
4 |     "LogitsProcessorWithFinalize",
5 | ]
6 | 


--------------------------------------------------------------------------------
/src/ldp/nn/generation/base.py:
--------------------------------------------------------------------------------
 1 | from abc import ABC, abstractmethod
 2 | 
 3 | import torch
 4 | from transformers import LogitsProcessor
 5 | 
 6 | 
 7 | class LogitsProcessorWithFinalize(LogitsProcessor, ABC):
 8 |     @abstractmethod
 9 |     def finalize(self, token_ids: torch.Tensor) -> None:
10 |         """A method for subclasses to inject arbitrary finalization logic after sampling finishes.
11 | 
12 |         TransformerHandler will invoke logit_processor.finalize(token_ids), where token_ids are
13 |         the sampled tokens.
14 |         """
15 | 


--------------------------------------------------------------------------------
/src/ldp/nn/utils.py:
--------------------------------------------------------------------------------
 1 | import random
 2 | from pathlib import Path
 3 | 
 4 | import numpy as np
 5 | import torch
 6 | 
 7 | 
 8 | def set_seed(seed: int | None) -> None:
 9 |     if seed is None:
10 |         return
11 | 
12 |     random.seed(seed)
13 |     np.random.seed(seed)  # noqa: NPY002
14 |     torch.manual_seed(seed)
15 |     torch.cuda.manual_seed(seed)
16 | 
17 | 
18 | REPO_ROOT = Path(__file__).parent.parent.parent
19 | 


--------------------------------------------------------------------------------
/src/ldp/py.typed:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Future-House/ldp/2e9557233dc0e4c8abbb9f1f065059108a0dcfcd/src/ldp/py.typed


--------------------------------------------------------------------------------
/src/ldp/shims.py:
--------------------------------------------------------------------------------
 1 | __all__ = ["tqdm", "trange"]
 2 | 
 3 | import logging
 4 | import os
 5 | 
 6 | from tqdm import tqdm, trange
 7 | 
 8 | logger = logging.getLogger(__name__)
 9 | 
10 | if os.environ.get("LDP_TQDM_USE_RICH", "").lower() in {"1", "true", "yes"}:
11 |     # TODO: remove after https://github.com/tqdm/tqdm/issues/1618
12 |     try:
13 |         # pylint: disable-next=reimported
14 |         from tqdm.rich import tqdm, trange  # type: ignore[no-redef]
15 |     except ModuleNotFoundError:
16 |         logger.warning(
17 |             "User opted into rich progress via the environment variable"
18 |             " LDP_TQDM_USE_RICH, but did not have 'rich' installed."
19 |             " Please run `pip install ldp[rich]`.",
20 |             exc_info=True,
21 |         )
22 | 


--------------------------------------------------------------------------------
/src/ldp/utils.py:
--------------------------------------------------------------------------------
  1 | import logging
  2 | import logging.config
  3 | from typing import Any
  4 | 
  5 | logger = logging.getLogger(__name__)
  6 | 
  7 | 
  8 | def configure_stdout_logs(
  9 |     name: str = "root",
 10 |     level: int | str = logging.INFO,
 11 |     fmt: str = "%(asctime)s - %(name)s - %(levelname)s - %(message)s",
 12 | ) -> None:
 13 |     """Configure root logger to log to stdout.
 14 | 
 15 |     Args:
 16 |         name: Optional logger name, if unspecified the 'root' logger is configured.
 17 |         level: Log level to be emitted to stdout.
 18 |         fmt: Optional format string.
 19 |     """
 20 |     config: dict[str, Any] = {name: {"level": level, "handlers": ["stdout"]}}
 21 |     if name != "root":  # Non-root loggers need to be in a "loggers" key
 22 |         config["loggers"] = config
 23 |     logging.config.dictConfig(
 24 |         {
 25 |             "version": 1,
 26 |             "disable_existing_loggers": False,
 27 |             "formatters": {"standard": {"format": fmt}},
 28 |             "handlers": {
 29 |                 "stdout": {
 30 |                     "level": "INFO",
 31 |                     "formatter": "standard",
 32 |                     "class": "logging.StreamHandler",
 33 |                     "stream": "ext://sys.stdout",
 34 |                 },
 35 |             },
 36 |         }
 37 |         | config
 38 |     )
 39 | 
 40 | 
 41 | def discounted_returns(
 42 |     rewards: list[float], terminated: list[bool], discount: float = 1.0
 43 | ) -> list[float]:
 44 |     r"""
 45 |     Calculate the discounted returns for a list of rewards, considering termination flags and a discount factor.
 46 | 
 47 |     The discounted return represents the future discounted rewards from each time step onwards, taking into account
 48 |     whether an episode has terminated at each step.
 49 | 
 50 |     The discounted return \( G_t \) is given by:
 51 | 
 52 |     .. math::
 53 |         G_t = \sum_{k=1}^{\infty} \gamma^{k-1} R_{t+k}
 54 | 
 55 |         where:
 56 |         - \( G_t \) is the discounted return starting from time step \( t \).
 57 |         - \( \gamma \) is the discount factor.
 58 |         - \( R_{t+k} \) is the reward received at time step \( t+k \).
 59 | 
 60 |     NOTE: this could live in ldp.alg, but it's here to avoid circular imports.
 61 | 
 62 |     Args:
 63 |         rewards: A list of rewards at each time step.
 64 |         terminated: A list of boolean flags indicating whether the episode terminated at each time step.
 65 |         discount: Discount factor to apply to future rewards. Defaults to 1.0 which means no discounting is applied.
 66 | 
 67 |     Returns:
 68 |         A list of discounted returns (rewards to go), with each element representing the
 69 |             total discounted reward from that step onwards.
 70 | 
 71 |     Example:
 72 |         >>> rewards = [1.0, 2.0, 3.0]
 73 |         >>> terminated = [False, False, True]
 74 |         >>> discounted_returns(rewards, terminated, discount=0.9)
 75 |         [5.23, 4.7, 3.0]
 76 |     """
 77 |     returns = []
 78 |     r = 0.0
 79 |     for reward, term in zip(reversed(rewards), reversed(terminated), strict=False):
 80 |         # 1 - term is 0 if the episode has terminated
 81 |         r = reward + discount * r * (1 - term)
 82 |         returns.append(r)
 83 |     returns.reverse()
 84 |     return returns
 85 | 
 86 | 
 87 | def format_error_details(error: Exception) -> str:
 88 |     """Format detailed error information from an exception.
 89 | 
 90 |     Specially handles HTTP errors that have response attributes with status codes
 91 |     and JSON details, but works with any exception type.
 92 | 
 93 |     Args:
 94 |         error: The exception to format
 95 | 
 96 |     Returns:
 97 |         A formatted error string with available details
 98 |     """
 99 |     error_details = f"{error!s}"
100 | 
101 |     if hasattr(error, "response"):
102 |         error_details += f"\nStatus code: {error.response.status_code}"
103 |         try:
104 |             response_data = error.response.json()
105 |             if "detail" in response_data:
106 |                 error_details += "\nServer Traceback:\n"
107 |                 for line in response_data["detail"].split("\n"):
108 |                     error_details += f"    {line}\n"
109 |         except Exception:
110 |             error_details += f"\nResponse body: {error.response.text}"
111 | 
112 |     return error_details
113 | 


--------------------------------------------------------------------------------
/tests/.gitignore:
--------------------------------------------------------------------------------
1 | test_outputs/
2 | 


--------------------------------------------------------------------------------
/tests/__init__.py:
--------------------------------------------------------------------------------
1 | import pathlib
2 | 
3 | TESTS_DIR = pathlib.Path(__file__).parent
4 | CASSETTES_DIR = TESTS_DIR / "cassettes"
5 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestLLMCallOp.test_cost_tracking.yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "user", "content": "Generate a story"}], "model":
  5 |         "gpt-3.5-turbo", "temperature": 0.1, "tool_choice": "required", "tools": [{"type":
  6 |         "function", "function": {"name": "generate_story", "description": "Generate
  7 |         a story.", "parameters": {"type": "object", "properties": {}, "required": []}}}]}'
  8 |       headers:
  9 |         accept:
 10 |           - application/json
 11 |         accept-encoding:
 12 |           - gzip, deflate
 13 |         connection:
 14 |           - keep-alive
 15 |         content-length:
 16 |           - "313"
 17 |         content-type:
 18 |           - application/json
 19 |         host:
 20 |           - api.openai.com
 21 |         user-agent:
 22 |           - AsyncOpenAI/Python 1.54.3
 23 |         x-stainless-arch:
 24 |           - arm64
 25 |         x-stainless-async:
 26 |           - async:asyncio
 27 |         x-stainless-lang:
 28 |           - python
 29 |         x-stainless-os:
 30 |           - MacOS
 31 |         x-stainless-package-version:
 32 |           - 1.54.3
 33 |         x-stainless-raw-response:
 34 |           - "true"
 35 |         x-stainless-retry-count:
 36 |           - "0"
 37 |         x-stainless-runtime:
 38 |           - CPython
 39 |         x-stainless-runtime-version:
 40 |           - 3.12.7
 41 |       method: POST
 42 |       uri: https://api.openai.com/v1/chat/completions
 43 |     response:
 44 |       body:
 45 |         string: !!binary |
 46 |           H4sIAAAAAAAAA4xT70/bMBD9nr/Cus8talJ+lHxjElQgmCaYmGCaIte5JgbH9uwLW1X1f5+clCQt
 47 |           RVo+WNa9e+/enS/riDGQOaQMRMlJVFaNL+4f8vj58vnH9Vx9eTp/LZOvZXH75+14fhWfwigwzOIF
 48 |           Bb2zjoSprEKSRrewcMgJg2p8No3jySw5PWuAyuSoAq2wNJ4enYypdgsznsTJyZZZGinQQ8p+Rowx
 49 |           tm7O4FHn+BdSNhm9Ryr0nhcIaZfEGDijQgS499IT1wSjHhRGE+pgW9dKDQAyRmWCK9UXbr/14N4P
 50 |           iiuV2SS5eNA35uXpbjp/u53MH3/ffPs+ux/Ua6VXtjG0rLXoBjTAu3i6V4wx0LxquAVqdJww82Tc
 51 |           ak+BMeCuqCvUFNzDegM7+CY6dP816N7hsvZcbceyjW+6OStTWGcWfm9ssJRa+jJzyH1jHzwZ29YO
 52 |           dZoKUO88EVhnKksZmVfUQfA4buWg36AenG0xMsTVgHM+OiCW5UhcNg/Y7YzgosS8Z/a7w+tcmgEQ
 53 |           DVr+6OWQdtu21MX/yPeAEGgJ88w6zKXY7bdPcxh+r8/SuhE3hsGvPGGVLaUu0FknuwWPNtE/AAAA
 54 |           //8DAKbQ9nDfAwAA
 55 |       headers:
 56 |         CF-Cache-Status:
 57 |           - DYNAMIC
 58 |         CF-RAY:
 59 |           - 8df951106c0fce74-SJC
 60 |         Connection:
 61 |           - keep-alive
 62 |         Content-Encoding:
 63 |           - gzip
 64 |         Content-Type:
 65 |           - application/json
 66 |         Date:
 67 |           - Fri, 08 Nov 2024 23:24:28 GMT
 68 |         Server:
 69 |           - cloudflare
 70 |         Set-Cookie:
 71 |           - __cf_bm=rCyb7ZMvV5wiHKaeBdiNZlwHnkJK6tg2ANDGf7CLuDQ-1731108268-1.0.1.1-TV4yUO3TR983XeJzGOzeANJ9oow4wDmcxbZ8oaqgrJOQPEhkWv2F4Z.ZGNjzmCoXE.kIh6uVXz.pbGFeFvPSOQ;
 72 |             path=/; expires=Fri, 08-Nov-24 23:54:28 GMT; domain=.api.openai.com; HttpOnly;
 73 |             Secure; SameSite=None
 74 |           - _cfuvid=mB2ccx6IlyDMQkGU81Vj.KiHjbPKz88kyBcj9Q5UQCk-1731108268004-0.0.1.1-604800000;
 75 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 76 |         Transfer-Encoding:
 77 |           - chunked
 78 |         X-Content-Type-Options:
 79 |           - nosniff
 80 |         access-control-expose-headers:
 81 |           - X-Request-ID
 82 |         alt-svc:
 83 |           - h3=":443"; ma=86400
 84 |         openai-organization:
 85 |           - future-house-xr4tdh
 86 |         openai-processing-ms:
 87 |           - "281"
 88 |         openai-version:
 89 |           - "2020-10-01"
 90 |         strict-transport-security:
 91 |           - max-age=31536000; includeSubDomains; preload
 92 |         x-ratelimit-limit-requests:
 93 |           - "12000"
 94 |         x-ratelimit-limit-tokens:
 95 |           - "1000000"
 96 |         x-ratelimit-remaining-requests:
 97 |           - "11999"
 98 |         x-ratelimit-remaining-tokens:
 99 |           - "999978"
100 |         x-ratelimit-reset-requests:
101 |           - 5ms
102 |         x-ratelimit-reset-tokens:
103 |           - 1ms
104 |         x-request-id:
105 |           - req_448537f2622e7777bbf6f0e7ff4bb17e
106 |       status:
107 |         code: 200
108 |         message: OK
109 | version: 1
110 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestLLMCallOp.test_empty_tools.yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "user", "content": "Hello"}], "model": "gpt-4o-mini-2024-07-18",
  5 |         "max_tokens": 4096, "n": 1, "temperature": 0.1}'
  6 |       headers:
  7 |         accept:
  8 |           - application/json
  9 |         accept-encoding:
 10 |           - gzip, deflate
 11 |         connection:
 12 |           - keep-alive
 13 |         content-length:
 14 |           - "135"
 15 |         content-type:
 16 |           - application/json
 17 |         host:
 18 |           - api.openai.com
 19 |         user-agent:
 20 |           - AsyncOpenAI/Python 1.59.9
 21 |         x-stainless-arch:
 22 |           - arm64
 23 |         x-stainless-async:
 24 |           - async:asyncio
 25 |         x-stainless-lang:
 26 |           - python
 27 |         x-stainless-os:
 28 |           - MacOS
 29 |         x-stainless-package-version:
 30 |           - 1.59.9
 31 |         x-stainless-raw-response:
 32 |           - "true"
 33 |         x-stainless-retry-count:
 34 |           - "0"
 35 |         x-stainless-runtime:
 36 |           - CPython
 37 |         x-stainless-runtime-version:
 38 |           - 3.12.7
 39 |       method: POST
 40 |       uri: https://api.openai.com/v1/chat/completions
 41 |     response:
 42 |       body:
 43 |         string: !!binary |
 44 |           H4sIAAAAAAAAAwAAAP//jFJBbtswELzrFds9W4UtB43sS5A2QdLm2gYBikKgyZXMhOISJNXWCPz3
 45 |           gpJtyWgL5KLDzM5oZrmvGQBqhWtAuRVRts7k15392BWrTw+Pj/Z29c09FdeKHr7cfe2eixucJQVv
 46 |           nknGo+q95NYZiprtQEtPIlJyXVwuy/mqLIuiJ1pWZJKscTG/4LzVVufFvLjI55f5ojyot6wlBVzD
 47 |           9wwA4LX/ppxW0W9cw3x2RFoKQTSE69MQAHo2CUERgg5R2IizkZRsI9k++j0Zw+/gnn+BFBY+wyCA
 48 |           HXcQWYnd1VToqe6CSOFtZ8wB35+SGG6c50048Ce81laHbeVJBLbpryGyw57dZwA/+sbdWQl0nlsX
 49 |           q8gvZJNhObjhuOaRWxyWgZGjMBP8KDozqxRFoU2YLAylkFtSo3LcruiU5gmRTSr/HeZf3kNtbZu3
 50 |           2I+ElOQiqcp5UlqeFx7HPKUj/N/YacV9YAzkf2pJVdTk0zMoqkVnhtPAsAuR2qrWtiHvvB7uo3bV
 51 |           RpXLZbGqPywx22d/AAAA//8DAGvr9u8tAwAA
 52 |       headers:
 53 |         CF-Cache-Status:
 54 |           - DYNAMIC
 55 |         CF-RAY:
 56 |           - 9093fce7094e642c-SJC
 57 |         Connection:
 58 |           - keep-alive
 59 |         Content-Encoding:
 60 |           - gzip
 61 |         Content-Type:
 62 |           - application/json
 63 |         Date:
 64 |           - Tue, 28 Jan 2025 21:13:42 GMT
 65 |         Server:
 66 |           - cloudflare
 67 |         Set-Cookie:
 68 |           - __cf_bm=mxF_vDWaXSGuf9hKQnemjKvROt3mU3dFb69K_cFGmWA-1738098822-1.0.1.1-U9A9Wj1HMiApuDMzvl0Sz6xbEsOPlP3NiSxSQ1wVHhepccJyasTXm021aYIJ4kf5bGdc6KT_qLtB0wqQNwMTkg;
 69 |             path=/; expires=Tue, 28-Jan-25 21:43:42 GMT; domain=.api.openai.com; HttpOnly;
 70 |             Secure; SameSite=None
 71 |           - _cfuvid=tS3l16tuNKSemon6BRJsWhoLLS9VzvAut45DhtCV.Bk-1738098822778-0.0.1.1-604800000;
 72 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 73 |         Transfer-Encoding:
 74 |           - chunked
 75 |         X-Content-Type-Options:
 76 |           - nosniff
 77 |         access-control-expose-headers:
 78 |           - X-Request-ID
 79 |         alt-svc:
 80 |           - h3=":443"; ma=86400
 81 |         openai-organization:
 82 |           - future-house-xr4tdh
 83 |         openai-processing-ms:
 84 |           - "399"
 85 |         openai-version:
 86 |           - "2020-10-01"
 87 |         strict-transport-security:
 88 |           - max-age=31536000; includeSubDomains; preload
 89 |         x-ratelimit-limit-requests:
 90 |           - "30000"
 91 |         x-ratelimit-limit-tokens:
 92 |           - "150000000"
 93 |         x-ratelimit-remaining-requests:
 94 |           - "29999"
 95 |         x-ratelimit-remaining-tokens:
 96 |           - "149995900"
 97 |         x-ratelimit-reset-requests:
 98 |           - 2ms
 99 |         x-ratelimit-reset-tokens:
100 |           - 1ms
101 |         x-request-id:
102 |           - req_e420e89656c3bae9b35eae4dbd97d277
103 |       status:
104 |         code: 200
105 |         message: OK
106 | version: 1
107 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestLLMCallOp.test_validation.yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "user", "content": "Hello"}], "model": "gpt-4o-mini-2024-07-18",
  5 |         "n": 1}'
  6 |       headers:
  7 |         accept:
  8 |           - application/json
  9 |         accept-encoding:
 10 |           - gzip, deflate
 11 |         connection:
 12 |           - keep-alive
 13 |         content-length:
 14 |           - "95"
 15 |         content-type:
 16 |           - application/json
 17 |         host:
 18 |           - api.openai.com
 19 |         user-agent:
 20 |           - AsyncOpenAI/Python 1.59.7
 21 |         x-stainless-arch:
 22 |           - x64
 23 |         x-stainless-async:
 24 |           - async:asyncio
 25 |         x-stainless-lang:
 26 |           - python
 27 |         x-stainless-os:
 28 |           - Linux
 29 |         x-stainless-package-version:
 30 |           - 1.59.7
 31 |         x-stainless-raw-response:
 32 |           - "true"
 33 |         x-stainless-retry-count:
 34 |           - "0"
 35 |         x-stainless-runtime:
 36 |           - CPython
 37 |         x-stainless-runtime-version:
 38 |           - 3.12.4
 39 |       method: POST
 40 |       uri: https://api.openai.com/v1/chat/completions
 41 |     response:
 42 |       body:
 43 |         string: !!binary |
 44 |           H4sIAAAAAAAAA4xSwY7TMBC95yuGOTcoLV2l7QUhkOhKe4ADEssKRa49SQ2Ox9jOQrXqvyMnbZMK
 45 |           VtpLDu/Ne3lvPE8ZAGqFG0C5F1G2zuTvfr0v17vV/debg/h2t+WPj59UWX6+X3+4+3KLs6Tg3Q+S
 46 |           8ax6Lbl1hqJmO9DSk4iUXOflm7IoFutV2RMtKzJJ1riYLzlvtdX5olgs86LM56uTes9aUsANPGQA
 47 |           AE/9N+W0iv7gBorZGWkpBNEQbi5DAOjZJARFCDpEYSPORlKyjWT76Fsyhl/Bln+DFBZuYRDAgTuI
 48 |           rMTh7VToqe6CSOFtZ8wJP16SGG6c51048Re81laHfeVJBLbpryGyw549ZgDf+8bdVQl0nlsXq8g/
 49 |           ySbD1eCG45pHbn5aBkaOwkzws+jKrFIUhTZhsjCUQu5Jjcpxu6JTmidENqn8b5j/eQ+1tW1eYj8S
 50 |           UpKLpCrnSWl5XXgc85SO8Lmxy4r7wBjIP2pJVdTk0zMoqkVnhtPAcAiR2qrWtiHvvB7uo3ZVuSBV
 51 |           it3NUmJ2zP4CAAD//wMAc2QAgS0DAAA=
 52 |       headers:
 53 |         CF-Cache-Status:
 54 |           - DYNAMIC
 55 |         CF-RAY:
 56 |           - 902b7b21ef9cba21-SEA
 57 |         Connection:
 58 |           - keep-alive
 59 |         Content-Encoding:
 60 |           - gzip
 61 |         Content-Type:
 62 |           - application/json
 63 |         Date:
 64 |           - Thu, 16 Jan 2025 04:49:48 GMT
 65 |         Server:
 66 |           - cloudflare
 67 |         Set-Cookie:
 68 |           - __cf_bm=940efh6IXrRBGzKpiScnpcSFSq.Qq5h.tZsG.tFRuXE-1737002988-1.0.1.1-glrn9jp0jJubbYQm1IpaQ0F7.hBwZxBO7pjIgct3Hry182dHr7EMmLLb4RleHEPiSBfV0OrZD33VvlywHYIHwg;
 69 |             path=/; expires=Thu, 16-Jan-25 05:19:48 GMT; domain=.api.openai.com; HttpOnly;
 70 |             Secure; SameSite=None
 71 |           - _cfuvid=fAwazJ9ZSOYywFdRAWoUeWZsgr45nzOyAHTcLlcUSP0-1737002988356-0.0.1.1-604800000;
 72 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 73 |         Transfer-Encoding:
 74 |           - chunked
 75 |         X-Content-Type-Options:
 76 |           - nosniff
 77 |         access-control-expose-headers:
 78 |           - X-Request-ID
 79 |         alt-svc:
 80 |           - h3=":443"; ma=86400
 81 |         openai-organization:
 82 |           - future-house-xr4tdh
 83 |         openai-processing-ms:
 84 |           - "404"
 85 |         openai-version:
 86 |           - "2020-10-01"
 87 |         strict-transport-security:
 88 |           - max-age=31536000; includeSubDomains; preload
 89 |         x-ratelimit-limit-requests:
 90 |           - "30000"
 91 |         x-ratelimit-limit-tokens:
 92 |           - "150000000"
 93 |         x-ratelimit-remaining-requests:
 94 |           - "29999"
 95 |         x-ratelimit-remaining-tokens:
 96 |           - "149999981"
 97 |         x-ratelimit-reset-requests:
 98 |           - 2ms
 99 |         x-ratelimit-reset-tokens:
100 |           - 0s
101 |         x-request-id:
102 |           - req_0ee9e043e2ad94fb0c69ad10bdbfa73e
103 |       status:
104 |         code: 200
105 |         message: OK
106 | version: 1
107 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestLLMModel.test_model[claude-3-haiku-20240307].yaml:
--------------------------------------------------------------------------------
 1 | interactions:
 2 |   - request:
 3 |       body:
 4 |         '{"messages": [{"role": "user", "content": [{"type": "text", "text": "Hello,
 5 |         how are you?"}]}], "system": [{"type": "text", "text": "Respond with single
 6 |         words."}], "max_tokens": 4096, "model": "claude-3-haiku-20240307"}'
 7 |       headers:
 8 |         accept:
 9 |           - application/json
10 |         accept-encoding:
11 |           - gzip, deflate
12 |         anthropic-version:
13 |           - "2023-06-01"
14 |         connection:
15 |           - keep-alive
16 |         content-length:
17 |           - "218"
18 |         content-type:
19 |           - application/json
20 |         host:
21 |           - api.anthropic.com
22 |         user-agent:
23 |           - litellm/1.52.3
24 |       method: POST
25 |       uri: https://api.anthropic.com/v1/messages
26 |     response:
27 |       body:
28 |         string: !!binary |
29 |           H4sIAAAAAAAAA1SOzWrCQBSF3+WsJzJqsHW2LXSjoLRQipQwJBcdMrkTc+9AJeTdS8QuujrwnR/O
30 |           iNDAoZNzZZfl7eO4fXl7v7yGzXN92Hfhuuu+YKC3nuYUifgzwWBIcQZeJIh6Vhh0qaEIhzr63FCx
31 |           Li4+tLlY2VVp1/YJBnViJVa40/i3qPQzd+/i8EkxLjB9G4imvhrIS2I4EDeV5oHxMISumbgmOM4x
32 |           GuT7KzcicJ+10tQSC9xya5Cy/kN2mn4BAAD//wMA53MTs/MAAAA=
33 |       headers:
34 |         CF-Cache-Status:
35 |           - DYNAMIC
36 |         CF-RAY:
37 |           - 8df951213bb996c9-SJC
38 |         Connection:
39 |           - keep-alive
40 |         Content-Encoding:
41 |           - gzip
42 |         Content-Type:
43 |           - application/json
44 |         Date:
45 |           - Fri, 08 Nov 2024 23:24:30 GMT
46 |         Server:
47 |           - cloudflare
48 |         Transfer-Encoding:
49 |           - chunked
50 |         X-Robots-Tag:
51 |           - none
52 |         anthropic-ratelimit-requests-limit:
53 |           - "5000"
54 |         anthropic-ratelimit-requests-remaining:
55 |           - "4999"
56 |         anthropic-ratelimit-requests-reset:
57 |           - "2024-11-08T23:25:12Z"
58 |         anthropic-ratelimit-tokens-limit:
59 |           - "5000000"
60 |         anthropic-ratelimit-tokens-remaining:
61 |           - "5000000"
62 |         anthropic-ratelimit-tokens-reset:
63 |           - "2024-11-08T23:24:30Z"
64 |         request-id:
65 |           - req_01Ri7jk6wtRpYL45Y9DA7ubB
66 |         via:
67 |           - 1.1 google
68 |       status:
69 |         code: 200
70 |         message: OK
71 | version: 1
72 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestLLMModel.test_model[gpt-3.5-turbo].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "system", "content": "Respond with single words."},
  5 |         {"role": "user", "content": "Hello, how are you?"}], "model": "gpt-3.5-turbo"}'
  6 |       headers:
  7 |         accept:
  8 |           - application/json
  9 |         accept-encoding:
 10 |           - gzip, deflate
 11 |         connection:
 12 |           - keep-alive
 13 |         content-length:
 14 |           - "153"
 15 |         content-type:
 16 |           - application/json
 17 |         host:
 18 |           - api.openai.com
 19 |         user-agent:
 20 |           - AsyncOpenAI/Python 1.54.3
 21 |         x-stainless-arch:
 22 |           - arm64
 23 |         x-stainless-async:
 24 |           - async:asyncio
 25 |         x-stainless-lang:
 26 |           - python
 27 |         x-stainless-os:
 28 |           - MacOS
 29 |         x-stainless-package-version:
 30 |           - 1.54.3
 31 |         x-stainless-raw-response:
 32 |           - "true"
 33 |         x-stainless-retry-count:
 34 |           - "1"
 35 |         x-stainless-runtime:
 36 |           - CPython
 37 |         x-stainless-runtime-version:
 38 |           - 3.12.7
 39 |       method: POST
 40 |       uri: https://api.openai.com/v1/chat/completions
 41 |     response:
 42 |       body:
 43 |         string: !!binary |
 44 |           H4sIAAAAAAAAA4ySMWvDMBCFd/8KodkOttOkwVspFEqXknQrxcjSxVYjS0I6l5SQ/17kJLZDU+ii
 45 |           4b57T+9OOkSEUCloQShvGPLWquRhvRHpy93q0b3m+qvp9vgM2bp629mNzWkcFKb6BI4X1Yyb1ipA
 46 |           afQJcwcMIbhm9/MsS1f5ctmD1ghQQVZbTOazRYKdq0ySZvnirGyM5OBpQd4jQgg59GfIqAXsaUHS
 47 |           +FJpwXtWAy2GJkKoMypUKPNeemQaaTxCbjSC7mM/SQ1T5GDbeRai6U6pc/043KVMbZ2p/JkP9a3U
 48 |           0jelA+aNDr4ejaU9PUaEfPQzdVcxqXWmtVii2YEOhnl+sqPjFkeYnRkaZGqimcc3zEoByKTyk5VQ
 49 |           zngDYlSO+2OdkGYCosnIv7Pc8j6NLXX9H/sRcA4WQZTWgZD8et6xzUH4Yn+1DSvuA1P/7RHacit1
 50 |           Dc462T9y/5LH6AcAAP//AwCdh9cz4wIAAA==
 51 |       headers:
 52 |         CF-Cache-Status:
 53 |           - DYNAMIC
 54 |         CF-RAY:
 55 |           - 8df9510b69f62716-SJC
 56 |         Connection:
 57 |           - keep-alive
 58 |         Content-Encoding:
 59 |           - gzip
 60 |         Content-Type:
 61 |           - application/json
 62 |         Date:
 63 |           - Fri, 08 Nov 2024 23:24:27 GMT
 64 |         Server:
 65 |           - cloudflare
 66 |         Transfer-Encoding:
 67 |           - chunked
 68 |         X-Content-Type-Options:
 69 |           - nosniff
 70 |         access-control-expose-headers:
 71 |           - X-Request-ID
 72 |         alt-svc:
 73 |           - h3=":443"; ma=86400
 74 |         openai-organization:
 75 |           - future-house-xr4tdh
 76 |         openai-processing-ms:
 77 |           - "182"
 78 |         openai-version:
 79 |           - "2020-10-01"
 80 |         strict-transport-security:
 81 |           - max-age=31536000; includeSubDomains; preload
 82 |         x-ratelimit-limit-requests:
 83 |           - "12000"
 84 |         x-ratelimit-limit-tokens:
 85 |           - "1000000"
 86 |         x-ratelimit-remaining-requests:
 87 |           - "11999"
 88 |         x-ratelimit-remaining-tokens:
 89 |           - "999969"
 90 |         x-ratelimit-reset-requests:
 91 |           - 5ms
 92 |         x-ratelimit-reset-tokens:
 93 |           - 1ms
 94 |         x-request-id:
 95 |           - req_c281bfa51f535d6093a3b049c4f0ca93
 96 |       status:
 97 |         code: 200
 98 |         message: OK
 99 | version: 1
100 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestLLMModel.test_output_schema[json-mode].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages":[{"role":"system","content":"Respond following this JSON schema:\n\n{\"properties\":
  5 |         {\"name\": {\"title\": \"Name\", \"type\": \"string\"}, \"age\": {\"title\":
  6 |         \"Age\", \"type\": \"integer\"}}, \"required\": [\"name\", \"age\"], \"title\":
  7 |         \"DummyOutputSchema\", \"type\": \"object\"}"},{"role":"user","content":"My
  8 |         name is Claude and I am 1 year old. What is my name and age?"}],"model":"gpt-3.5-turbo","response_format":{"type":"json_object"}}'
  9 |       headers:
 10 |         accept:
 11 |           - application/json
 12 |         accept-encoding:
 13 |           - gzip, deflate
 14 |         connection:
 15 |           - keep-alive
 16 |         content-length:
 17 |           - "459"
 18 |         content-type:
 19 |           - application/json
 20 |         host:
 21 |           - api.openai.com
 22 |         user-agent:
 23 |           - AsyncOpenAI/Python 1.55.3
 24 |         x-stainless-arch:
 25 |           - arm64
 26 |         x-stainless-async:
 27 |           - async:asyncio
 28 |         x-stainless-lang:
 29 |           - python
 30 |         x-stainless-os:
 31 |           - MacOS
 32 |         x-stainless-package-version:
 33 |           - 1.55.3
 34 |         x-stainless-raw-response:
 35 |           - "true"
 36 |         x-stainless-retry-count:
 37 |           - "0"
 38 |         x-stainless-runtime:
 39 |           - CPython
 40 |         x-stainless-runtime-version:
 41 |           - 3.12.7
 42 |       method: POST
 43 |       uri: https://api.openai.com/v1/chat/completions
 44 |     response:
 45 |       body:
 46 |         string: !!binary |
 47 |           H4sIAAAAAAAAA4ySQWvjMBCF7/4VYs5JqR1Ktr5ld1lKC720lJa6GEWaOOrKkpBGdJeQ/75IcWKH
 48 |           7sJefHjfzOO9sXYFY6Ak1AzElpPonZ6v+PPdU/d++/0+fPmIq+opPt483/zAh/j1pYJZ2rDrdxR0
 49 |           3LoQtncaSVlzwMIjJ0yu5XKxqJZldV1m0FuJOq11juaLi6s5Rb+288uyuho2t1YJDFCz14Ixxnb5
 50 |           mzIaib+gZpezo9JjCLxDqE9DjIG3OinAQ1CBuCGYjVBYQ2hy7F1jktSA4T02ULMGvmkeJTYwOyLe
 51 |           ZVI2Zj918biJgacWJmo96PtTLG075+06DPykb5RRYdt65MGaFCGQdZDpvmDsLdePZ43Aeds7asn+
 52 |           RJMMrxcHOxgPPsJyOUCyxPVEL4ebndu1EokrHSb3A8HFFuW4Oh6bR6nsBBST0p/T/M37UFyZ7n/s
 53 |           RyAEOkLZOo9SifPG45jH9B7/NXY6cg4M4Xcg7NuNMh1651V+Eflf7os/AAAA//8DAOtt/IcQAwAA
 54 |       headers:
 55 |         CF-Cache-Status:
 56 |           - DYNAMIC
 57 |         CF-RAY:
 58 |           - 8ec79940487acf0a-SJC
 59 |         Connection:
 60 |           - keep-alive
 61 |         Content-Encoding:
 62 |           - gzip
 63 |         Content-Type:
 64 |           - application/json
 65 |         Date:
 66 |           - Wed, 04 Dec 2024 00:14:51 GMT
 67 |         Server:
 68 |           - cloudflare
 69 |         Set-Cookie:
 70 |           - __cf_bm=Jt74XtlzTIX4qJ2I6JWts_1PUt6239EzTEKob0gbMYI-1733271291-1.0.1.1-Q2lRwwtee9d00lyYx_vjY4jpuRYySoyrIe_R4yj2LqAaxIDQLNQ99FxRmToXDEeMUPk5tUL1416FgdY7MIAURA;
 71 |             path=/; expires=Wed, 04-Dec-24 00:44:51 GMT; domain=.api.openai.com; HttpOnly;
 72 |             Secure; SameSite=None
 73 |           - _cfuvid=LgL7hRr_QJbzVlAiPhNhtvybE1Xb67FkF.lr0Cryt2I-1733271291893-0.0.1.1-604800000;
 74 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 75 |         Transfer-Encoding:
 76 |           - chunked
 77 |         X-Content-Type-Options:
 78 |           - nosniff
 79 |         access-control-expose-headers:
 80 |           - X-Request-ID
 81 |         alt-svc:
 82 |           - h3=":443"; ma=86400
 83 |         openai-organization:
 84 |           - future-house-xr4tdh
 85 |         openai-processing-ms:
 86 |           - "255"
 87 |         openai-version:
 88 |           - "2020-10-01"
 89 |         strict-transport-security:
 90 |           - max-age=31536000; includeSubDomains; preload
 91 |         x-ratelimit-limit-requests:
 92 |           - "12000"
 93 |         x-ratelimit-limit-tokens:
 94 |           - "1000000"
 95 |         x-ratelimit-remaining-requests:
 96 |           - "11999"
 97 |         x-ratelimit-remaining-tokens:
 98 |           - "999910"
 99 |         x-ratelimit-reset-requests:
100 |           - 5ms
101 |         x-ratelimit-reset-tokens:
102 |           - 5ms
103 |         x-request-id:
104 |           - req_9f36e635cd12593e29892e9b24310fc6
105 |       status:
106 |         code: 200
107 |         message: OK
108 | version: 1
109 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestLLMModel.test_output_schema[structured-outputs].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages":[{"role":"user","content":"My name is Claude and I am 1 year
  5 |         old. What is my name and age?"}],"model":"gpt-4o","response_format":{"type":"json_schema","json_schema":{"strict":true,"schema":{"properties":{"name":{"title":"Name","type":"string"},"age":{"title":"Age","type":"integer"}},"required":["name","age"],"title":"DummyOutputSchema","type":"object","additionalProperties":false},"name":"DummyOutputSchema"}}}'
  6 |       headers:
  7 |         accept:
  8 |           - application/json
  9 |         accept-encoding:
 10 |           - gzip, deflate
 11 |         connection:
 12 |           - keep-alive
 13 |         content-length:
 14 |           - "425"
 15 |         content-type:
 16 |           - application/json
 17 |         host:
 18 |           - api.openai.com
 19 |         user-agent:
 20 |           - AsyncOpenAI/Python 1.55.3
 21 |         x-stainless-arch:
 22 |           - arm64
 23 |         x-stainless-async:
 24 |           - async:asyncio
 25 |         x-stainless-lang:
 26 |           - python
 27 |         x-stainless-os:
 28 |           - MacOS
 29 |         x-stainless-package-version:
 30 |           - 1.55.3
 31 |         x-stainless-raw-response:
 32 |           - "true"
 33 |         x-stainless-retry-count:
 34 |           - "0"
 35 |         x-stainless-runtime:
 36 |           - CPython
 37 |         x-stainless-runtime-version:
 38 |           - 3.12.7
 39 |       method: POST
 40 |       uri: https://api.openai.com/v1/chat/completions
 41 |     response:
 42 |       body:
 43 |         string: !!binary |
 44 |           H4sIAAAAAAAAA4xSu07EMBDs8xXW1gkKCeKOdAgqKCgoeAVFPnuTMzhey3YE6HT/jpx75E6ARONi
 45 |           Zmc8s/YqYQyUhIqBWPIgequzS/748PQh6AKL+5uebOvubuXl1/XzQKWFNCpo8YYi7FQngnqrMSgy
 46 |           G1o45AGj6+msLItZkZfzkehJoo6yzobsjLIiL86yfJ7l51vhkpRADxV7SRhjbDWeMaKR+AkVy9Md
 47 |           0qP3vEOo9kOMgSMdEeDeKx+4CZBOpCAT0IypVzUY3mMNVQ1Xmg8Sa0hr4F2ETteHKoft4HkMbQat
 48 |           t/h6H0NTZx0t/Jbf460yyi8bh9yTiVf6QBZGdp0w9jrWHY4agHXU29AEekcTDWcXGzuY9juROy5Q
 49 |           4HqC5/P0F7NGYuBK+4NtgeBiiXJSTqvlg1R0QCQHlX9m+c17U1uZ7j/2EyEE2oCysQ6lEsd9pzGH
 50 |           8fP9NbZf8RgY/JcP2DetMh0669Tm/VvbzNrzBZbYLnJI1sk3AAAA//8DAEganQUIAwAA
 51 |       headers:
 52 |         CF-Cache-Status:
 53 |           - DYNAMIC
 54 |         CF-RAY:
 55 |           - 8ec7ab7ffe551679-SJC
 56 |         Connection:
 57 |           - keep-alive
 58 |         Content-Encoding:
 59 |           - gzip
 60 |         Content-Type:
 61 |           - application/json
 62 |         Date:
 63 |           - Wed, 04 Dec 2024 00:27:18 GMT
 64 |         Server:
 65 |           - cloudflare
 66 |         Transfer-Encoding:
 67 |           - chunked
 68 |         X-Content-Type-Options:
 69 |           - nosniff
 70 |         access-control-expose-headers:
 71 |           - X-Request-ID
 72 |         alt-svc:
 73 |           - h3=":443"; ma=86400
 74 |         openai-organization:
 75 |           - future-house-xr4tdh
 76 |         openai-processing-ms:
 77 |           - "367"
 78 |         openai-version:
 79 |           - "2020-10-01"
 80 |         strict-transport-security:
 81 |           - max-age=31536000; includeSubDomains; preload
 82 |         x-ratelimit-limit-requests:
 83 |           - "10000"
 84 |         x-ratelimit-limit-tokens:
 85 |           - "30000000"
 86 |         x-ratelimit-remaining-requests:
 87 |           - "9998"
 88 |         x-ratelimit-remaining-tokens:
 89 |           - "29999967"
 90 |         x-ratelimit-reset-requests:
 91 |           - 6ms
 92 |         x-ratelimit-reset-tokens:
 93 |           - 0s
 94 |         x-request-id:
 95 |           - req_b1f66bf72beec8f42091a30db5131d27
 96 |       status:
 97 |         code: 200
 98 |         message: OK
 99 | version: 1
100 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestLLMModel.test_output_type_rejected_validation.yaml:
--------------------------------------------------------------------------------
 1 | interactions:
 2 |   - request:
 3 |       body:
 4 |         '{"messages": [{"role": "user", "content": [{"type": "text", "text": "What
 5 |         are three things I should do today?"}]}], "temperature": 0.1, "tools": [{"name":
 6 |         "json_tool_call", "input_schema": {"type": "object", "properties": {"values":
 7 |         null}}}], "tool_choice": {"name": "json_tool_call", "type": "tool"}, "system":
 8 |         [{"type": "text", "text": "Respond following this JSON schema:\n\n{\"properties\":
 9 |         {\"instructions\": {\"description\": \"list of instructions\", \"items\": {\"type\":
10 |         \"string\"}, \"title\": \"Instructions\", \"type\": \"array\"}}, \"required\":
11 |         [\"instructions\"], \"title\": \"InstructionList\", \"type\": \"object\"}"}],
12 |         "max_tokens": 4096, "model": "claude-3-haiku-20240307"}'
13 |       headers:
14 |         accept:
15 |           - application/json
16 |         accept-encoding:
17 |           - gzip, deflate
18 |         anthropic-version:
19 |           - "2023-06-01"
20 |         connection:
21 |           - keep-alive
22 |         content-length:
23 |           - "692"
24 |         content-type:
25 |           - application/json
26 |         host:
27 |           - api.anthropic.com
28 |         user-agent:
29 |           - litellm/1.52.5
30 |       method: POST
31 |       uri: https://api.anthropic.com/v1/messages
32 |     response:
33 |       body:
34 |         string:
35 |           '{"type":"error","error":{"type":"invalid_request_error","message":"tools.0.input_schema:
36 |           JSON schema is invalid - please consult https://json-schema.org or our documentation
37 |           at https://docs.anthropic.com/en/docs/tool-use"}}'
38 |       headers:
39 |         CF-Cache-Status:
40 |           - DYNAMIC
41 |         CF-RAY:
42 |           - 8e20db182b2d644d-SJC
43 |         Connection:
44 |           - keep-alive
45 |         Content-Length:
46 |           - "223"
47 |         Content-Type:
48 |           - application/json
49 |         Date:
50 |           - Wed, 13 Nov 2024 18:34:26 GMT
51 |         Server:
52 |           - cloudflare
53 |         X-Robots-Tag:
54 |           - none
55 |         request-id:
56 |           - req_01Ma1cK27HCaupfNBiwTjUFo
57 |         via:
58 |           - 1.1 google
59 |         x-should-retry:
60 |           - "false"
61 |       status:
62 |         code: 400
63 |         message: Bad Request
64 | version: 1
65 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestLLMModel.test_streaming[gpt-3.5-turbo].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "system", "content": "Respond with single words."},
  5 |         {"role": "user", "content": "Hello, how are you?"}], "model": "gpt-3.5-turbo",
  6 |         "stream": true, "stream_options": {"include_usage": true}, "temperature": 0.1}'
  7 |       headers:
  8 |         accept:
  9 |           - application/json
 10 |         accept-encoding:
 11 |           - gzip, deflate
 12 |         connection:
 13 |           - keep-alive
 14 |         content-length:
 15 |           - "232"
 16 |         content-type:
 17 |           - application/json
 18 |         host:
 19 |           - api.openai.com
 20 |         user-agent:
 21 |           - AsyncOpenAI/Python 1.54.3
 22 |         x-stainless-arch:
 23 |           - arm64
 24 |         x-stainless-async:
 25 |           - async:asyncio
 26 |         x-stainless-lang:
 27 |           - python
 28 |         x-stainless-os:
 29 |           - MacOS
 30 |         x-stainless-package-version:
 31 |           - 1.54.3
 32 |         x-stainless-raw-response:
 33 |           - "true"
 34 |         x-stainless-retry-count:
 35 |           - "1"
 36 |         x-stainless-runtime:
 37 |           - CPython
 38 |         x-stainless-runtime-version:
 39 |           - 3.12.7
 40 |       method: POST
 41 |       uri: https://api.openai.com/v1/chat/completions
 42 |     response:
 43 |       body:
 44 |         string:
 45 |           'data: {"id":"chatcmpl-ARSd2K2L3Lg87wmLEtOKlJ3tLCQem","object":"chat.completion.chunk","created":1731108268,"model":"gpt-3.5-turbo-0125","system_fingerprint":null,"choices":[{"index":0,"delta":{"role":"assistant","content":"","refusal":null},"logprobs":null,"finish_reason":null}],"usage":null}
 46 | 
 47 | 
 48 |           data: {"id":"chatcmpl-ARSd2K2L3Lg87wmLEtOKlJ3tLCQem","object":"chat.completion.chunk","created":1731108268,"model":"gpt-3.5-turbo-0125","system_fingerprint":null,"choices":[{"index":0,"delta":{"content":"Good"},"logprobs":null,"finish_reason":null}],"usage":null}
 49 | 
 50 | 
 51 |           data: {"id":"chatcmpl-ARSd2K2L3Lg87wmLEtOKlJ3tLCQem","object":"chat.completion.chunk","created":1731108268,"model":"gpt-3.5-turbo-0125","system_fingerprint":null,"choices":[{"index":0,"delta":{},"logprobs":null,"finish_reason":"stop"}],"usage":null}
 52 | 
 53 | 
 54 |           data: {"id":"chatcmpl-ARSd2K2L3Lg87wmLEtOKlJ3tLCQem","object":"chat.completion.chunk","created":1731108268,"model":"gpt-3.5-turbo-0125","system_fingerprint":null,"choices":[],"usage":{"prompt_tokens":22,"completion_tokens":1,"total_tokens":23,"prompt_tokens_details":{"cached_tokens":0,"audio_tokens":0},"completion_tokens_details":{"reasoning_tokens":0,"audio_tokens":0,"accepted_prediction_tokens":0,"rejected_prediction_tokens":0}}}
 55 | 
 56 | 
 57 |           data: [DONE]
 58 | 
 59 | 
 60 |           '
 61 |       headers:
 62 |         CF-Cache-Status:
 63 |           - DYNAMIC
 64 |         CF-RAY:
 65 |           - 8df951133c95cf4d-SJC
 66 |         Connection:
 67 |           - keep-alive
 68 |         Content-Type:
 69 |           - text/event-stream; charset=utf-8
 70 |         Date:
 71 |           - Fri, 08 Nov 2024 23:24:28 GMT
 72 |         Server:
 73 |           - cloudflare
 74 |         Transfer-Encoding:
 75 |           - chunked
 76 |         X-Content-Type-Options:
 77 |           - nosniff
 78 |         access-control-expose-headers:
 79 |           - X-Request-ID
 80 |         alt-svc:
 81 |           - h3=":443"; ma=86400
 82 |         openai-organization:
 83 |           - future-house-xr4tdh
 84 |         openai-processing-ms:
 85 |           - "197"
 86 |         openai-version:
 87 |           - "2020-10-01"
 88 |         strict-transport-security:
 89 |           - max-age=31536000; includeSubDomains; preload
 90 |         x-ratelimit-limit-requests:
 91 |           - "12000"
 92 |         x-ratelimit-limit-tokens:
 93 |           - "1000000"
 94 |         x-ratelimit-remaining-requests:
 95 |           - "11999"
 96 |         x-ratelimit-remaining-tokens:
 97 |           - "999969"
 98 |         x-ratelimit-reset-requests:
 99 |           - 5ms
100 |         x-ratelimit-reset-tokens:
101 |           - 1ms
102 |         x-request-id:
103 |           - req_378b8fdfe73f1f24710faf4cdc08d994
104 |       status:
105 |         code: 200
106 |         message: OK
107 | version: 1
108 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestLLMModel.test_text_image_message[claude-3-haiku-20240307].yaml:
--------------------------------------------------------------------------------
 1 | interactions:
 2 |   - request:
 3 |       body:
 4 |         '{"messages": [{"role": "user", "content": [{"type": "image", "source":
 5 |         {"type": "base64", "media_type": "image/png", "data": "iVBORw0KGgoAAAANSUhEUgAAACAAAAAgCAIAAAD8GO2jAAAAKElEQVR4nO3NMQEAAAjDMMC/ZzDBvlRA01vZJvwHAAAAAAAAAAAAbx2jxAE/i2AjOgAAAABJRU5ErkJggg=="}},
 6 |         {"type": "text", "text": "What color is this square? Respond only with the color
 7 |         name."}]}], "max_tokens": 4096, "model": "claude-3-haiku-20240307"}'
 8 |       headers:
 9 |         accept:
10 |           - application/json
11 |         accept-encoding:
12 |           - gzip, deflate
13 |         anthropic-version:
14 |           - "2023-06-01"
15 |         connection:
16 |           - keep-alive
17 |         content-length:
18 |           - "411"
19 |         content-type:
20 |           - application/json
21 |         host:
22 |           - api.anthropic.com
23 |         user-agent:
24 |           - litellm/1.52.3
25 |       method: POST
26 |       uri: https://api.anthropic.com/v1/messages
27 |     response:
28 |       body:
29 |         string: !!binary |
30 |           H4sIAAAAAAAAA0yOzWrDMBCE32XOcnHtQIjOuRZKrqUYYW1cEXnleHdbF+N3Lw4t9DTwzQ+zIkV4
31 |           jDJ09fNpGD+vsnxdDq/ntIzty3mw6wwH/Z5oT5FIGAgOc8k7CCJJNLDCYSyRMjz6HCxS1VYfId2s
32 |           aurmULf1EQ59YSVW+Lf1b1Fp2bsP8bhQfML27iBapm6mIIXhQRw7tZnxawjdjbgneLacHexxyq9I
33 |           PJl2Wm7EAt+cHIrpf3Tcth8AAAD//wMASKMtgPEAAAA=
34 |       headers:
35 |         CF-Cache-Status:
36 |           - DYNAMIC
37 |         CF-RAY:
38 |           - 8df951169f4d1563-SJC
39 |         Connection:
40 |           - keep-alive
41 |         Content-Encoding:
42 |           - gzip
43 |         Content-Type:
44 |           - application/json
45 |         Date:
46 |           - Fri, 08 Nov 2024 23:24:28 GMT
47 |         Server:
48 |           - cloudflare
49 |         Transfer-Encoding:
50 |           - chunked
51 |         X-Robots-Tag:
52 |           - none
53 |         anthropic-ratelimit-requests-limit:
54 |           - "5000"
55 |         anthropic-ratelimit-requests-remaining:
56 |           - "4999"
57 |         anthropic-ratelimit-requests-reset:
58 |           - "2024-11-08T23:25:12Z"
59 |         anthropic-ratelimit-tokens-limit:
60 |           - "5000000"
61 |         anthropic-ratelimit-tokens-remaining:
62 |           - "5000000"
63 |         anthropic-ratelimit-tokens-reset:
64 |           - "2024-11-08T23:24:28Z"
65 |         request-id:
66 |           - req_01MCaZRsMu3nB5nTfMA4ahTw
67 |         via:
68 |           - 1.1 google
69 |       status:
70 |         code: 200
71 |         message: OK
72 | version: 1
73 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestLLMModel.test_text_image_message[gpt-4o-mini-2024-07-18].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "user", "content": [{"type": "image_url", "image_url":
  5 |         {"url": "data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAACAAAAAgCAIAAAD8GO2jAAAAKElEQVR4nO3NMQEAAAjDMMC/ZzDBvlRA01vZJvwHAAAAAAAAAAAAbx2jxAE/i2AjOgAAAABJRU5ErkJggg=="}},
  6 |         {"type": "text", "text": "What color is this square? Respond only with the color
  7 |         name."}]}], "model": "gpt-4o-mini-2024-07-18"}'
  8 |       headers:
  9 |         accept:
 10 |           - application/json
 11 |         accept-encoding:
 12 |           - gzip, deflate
 13 |         connection:
 14 |           - keep-alive
 15 |         content-length:
 16 |           - "373"
 17 |         content-type:
 18 |           - application/json
 19 |         host:
 20 |           - api.openai.com
 21 |         user-agent:
 22 |           - AsyncOpenAI/Python 1.54.3
 23 |         x-stainless-arch:
 24 |           - arm64
 25 |         x-stainless-async:
 26 |           - async:asyncio
 27 |         x-stainless-lang:
 28 |           - python
 29 |         x-stainless-os:
 30 |           - MacOS
 31 |         x-stainless-package-version:
 32 |           - 1.54.3
 33 |         x-stainless-raw-response:
 34 |           - "true"
 35 |         x-stainless-retry-count:
 36 |           - "1"
 37 |         x-stainless-runtime:
 38 |           - CPython
 39 |         x-stainless-runtime-version:
 40 |           - 3.12.7
 41 |       method: POST
 42 |       uri: https://api.openai.com/v1/chat/completions
 43 |     response:
 44 |       body:
 45 |         string: !!binary |
 46 |           H4sIAAAAAAAAA4ySzWrDMBCE734KoXNcYjs/Tm6FEuilLUnppRQjSxtHjawVkgxtQ969yHFih7bQ
 47 |           iw/77Yxn1j5EhFAp6JJQvmOe10bFt+uNyPTdepUvnh6zJtunm9WXNfgsX+4f6CgosHwH7s+qG461
 48 |           UeAl6hPmFpiH4JrMsyQZ5+ls0YIaBaggq4yPJxjXUss4HaeTeDyPk7xT71BycHRJXiNCCDm0z5BT
 49 |           C/igSzIenSc1OMcqoMvLEiHUogoTypyTzjPt6aiHHLUH3UZfgxgSC9vGsZBON0p18+PlVQorY7F0
 50 |           Hb/Mt1JLtyssMIc62DqPhrb0GBHy1lZqrlJSY7E2vvC4Bx0M82nadaL9KXucdMyjZ+pKdSZXhoUA
 51 |           z6Ryg6tQzvgORK/tT8gaIXEAokHtn2l+8z5Vl7r6j30POAfjQRTGgpD8unG/ZiH8aX+tXc7cBqbu
 52 |           03moi63UFVhj5ek7b02xKOd5OUv4NKXRMfoGAAD//wMAHblqFfUCAAA=
 53 |       headers:
 54 |         CF-Cache-Status:
 55 |           - DYNAMIC
 56 |         CF-RAY:
 57 |           - 8df951157da42350-SJC
 58 |         Connection:
 59 |           - keep-alive
 60 |         Content-Encoding:
 61 |           - gzip
 62 |         Content-Type:
 63 |           - application/json
 64 |         Date:
 65 |           - Fri, 08 Nov 2024 23:24:29 GMT
 66 |         Server:
 67 |           - cloudflare
 68 |         Transfer-Encoding:
 69 |           - chunked
 70 |         X-Content-Type-Options:
 71 |           - nosniff
 72 |         access-control-expose-headers:
 73 |           - X-Request-ID
 74 |         alt-svc:
 75 |           - h3=":443"; ma=86400
 76 |         openai-organization:
 77 |           - future-house-xr4tdh
 78 |         openai-processing-ms:
 79 |           - "1481"
 80 |         openai-version:
 81 |           - "2020-10-01"
 82 |         strict-transport-security:
 83 |           - max-age=31536000; includeSubDomains; preload
 84 |         x-ratelimit-limit-input-images:
 85 |           - "50000"
 86 |         x-ratelimit-limit-requests:
 87 |           - "30000"
 88 |         x-ratelimit-limit-tokens:
 89 |           - "150000000"
 90 |         x-ratelimit-remaining-input-images:
 91 |           - "49999"
 92 |         x-ratelimit-remaining-requests:
 93 |           - "29999"
 94 |         x-ratelimit-remaining-tokens:
 95 |           - "149999202"
 96 |         x-ratelimit-reset-input-images:
 97 |           - 1ms
 98 |         x-ratelimit-reset-requests:
 99 |           - 2ms
100 |         x-ratelimit-reset-tokens:
101 |           - 0s
102 |         x-request-id:
103 |           - req_d6479069b3a902d72775895cd95ea324
104 |       status:
105 |         code: 200
106 |         message: OK
107 | version: 1
108 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestLiteEmbeddingModel.test_caching.yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"input": ["test1"], "model": "text-embedding-3-small", "dimensions": 8,
  5 |         "encoding_format": "float"}'
  6 |       headers:
  7 |         accept:
  8 |           - application/json
  9 |         accept-encoding:
 10 |           - gzip, deflate
 11 |         connection:
 12 |           - keep-alive
 13 |         content-length:
 14 |           - "100"
 15 |         content-type:
 16 |           - application/json
 17 |         host:
 18 |           - api.openai.com
 19 |         user-agent:
 20 |           - AsyncOpenAI/Python 1.54.3
 21 |         x-stainless-arch:
 22 |           - arm64
 23 |         x-stainless-async:
 24 |           - async:asyncio
 25 |         x-stainless-lang:
 26 |           - python
 27 |         x-stainless-os:
 28 |           - MacOS
 29 |         x-stainless-package-version:
 30 |           - 1.54.3
 31 |         x-stainless-raw-response:
 32 |           - "true"
 33 |         x-stainless-retry-count:
 34 |           - "1"
 35 |         x-stainless-runtime:
 36 |           - CPython
 37 |         x-stainless-runtime-version:
 38 |           - 3.12.7
 39 |       method: POST
 40 |       uri: https://api.openai.com/v1/embeddings
 41 |     response:
 42 |       body:
 43 |         string: !!binary |
 44 |           H4sIAAAAAAAAA1yQXWvDIBSG7/MrDue6KX4cP+JfGWXYKSWbiWVxUCj97yMu6+K8UHh88PW89w4A
 45 |           8/k9vhV0gGlcCh5WFnzx6OClAwC4170x43SOIYzzper1cpxDvKED9iR/0u9L6+rZkRMJ4ooODdSa
 46 |           Bst2kB0tESPijSesUpq4bSAzSpI0TP9XmTFGtDlysFoKvs8RQlmyetjQqZ6PDuBU25hyiGkdu8Rb
 47 |           6Z9j9bJfJp/ST2Vfi79EdFtbeP3M07W8lvwR5wUdbJ/AkotPO9ytQY/uGwAA//8DAOb7reqKAQAA
 48 |       headers:
 49 |         CF-Cache-Status:
 50 |           - DYNAMIC
 51 |         CF-RAY:
 52 |           - 8df950fdab81cf65-SJC
 53 |         Connection:
 54 |           - keep-alive
 55 |         Content-Encoding:
 56 |           - gzip
 57 |         Content-Type:
 58 |           - application/json
 59 |         Date:
 60 |           - Fri, 08 Nov 2024 23:24:24 GMT
 61 |         Server:
 62 |           - cloudflare
 63 |         Transfer-Encoding:
 64 |           - chunked
 65 |         X-Content-Type-Options:
 66 |           - nosniff
 67 |         access-control-allow-origin:
 68 |           - "*"
 69 |         access-control-expose-headers:
 70 |           - X-Request-ID
 71 |         alt-svc:
 72 |           - h3=":443"; ma=86400
 73 |         openai-model:
 74 |           - text-embedding-3-small
 75 |         openai-organization:
 76 |           - future-house-xr4tdh
 77 |         openai-processing-ms:
 78 |           - "64"
 79 |         openai-version:
 80 |           - "2020-10-01"
 81 |         strict-transport-security:
 82 |           - max-age=31536000; includeSubDomains; preload
 83 |         x-ratelimit-limit-requests:
 84 |           - "10000"
 85 |         x-ratelimit-limit-tokens:
 86 |           - "10000000"
 87 |         x-ratelimit-remaining-requests:
 88 |           - "9999"
 89 |         x-ratelimit-remaining-tokens:
 90 |           - "9991004"
 91 |         x-ratelimit-reset-requests:
 92 |           - 6ms
 93 |         x-ratelimit-reset-tokens:
 94 |           - 53ms
 95 |         x-request-id:
 96 |           - req_f154c6c0d1f72d1496189b1dc8372122
 97 |       status:
 98 |         code: 200
 99 |         message: OK
100 | version: 1
101 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestMultipleCompletionLLMModel.test_model[gpt-3.5-turbo].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "system", "content": "Respond with single words."},
  5 |         {"role": "user", "content": "Hello, how are you?"}], "model": "gpt-3.5-turbo",
  6 |         "n": 2}'
  7 |       headers:
  8 |         accept:
  9 |           - application/json
 10 |         accept-encoding:
 11 |           - gzip, deflate
 12 |         connection:
 13 |           - keep-alive
 14 |         content-length:
 15 |           - "161"
 16 |         content-type:
 17 |           - application/json
 18 |         host:
 19 |           - api.openai.com
 20 |         user-agent:
 21 |           - AsyncOpenAI/Python 1.54.3
 22 |         x-stainless-arch:
 23 |           - arm64
 24 |         x-stainless-async:
 25 |           - async:asyncio
 26 |         x-stainless-lang:
 27 |           - python
 28 |         x-stainless-os:
 29 |           - MacOS
 30 |         x-stainless-package-version:
 31 |           - 1.54.3
 32 |         x-stainless-raw-response:
 33 |           - "true"
 34 |         x-stainless-retry-count:
 35 |           - "1"
 36 |         x-stainless-runtime:
 37 |           - CPython
 38 |         x-stainless-runtime-version:
 39 |           - 3.12.7
 40 |       method: POST
 41 |       uri: https://api.openai.com/v1/chat/completions
 42 |     response:
 43 |       body:
 44 |         string: !!binary |
 45 |           H4sIAAAAAAAAA7RTsW7CMBDd8xWWZ0CEFNGysbSIpVIrsVRVZOwjGByfa18qEOLfKwdKgqBSh3bx
 46 |           cO/e83t39j5hjGvFx4zLlSBZOtOdvLyq7Sb78NNl9vn88Ojms918odczv72b8E5k4GINkr5ZPYml
 47 |           M0Aa7RGWHgRBVE1HWZr277PBsAZKVGAirXDUzXrDLlV+gd1+OhiemCvUEgIfs7eEMcb29Rk9WgVb
 48 |           Pmb9znelhBBEAXx8bmKMezSxwkUIOpCwxDsNKNES2Nr2E6JqQx6WVRDRmq2MOdUP57sMFs7jIpzw
 49 |           c32prQ6r3IMIaKNuIHQ8aZGvAqR/E2AKxmCPxRy9fw6SMPZeL6e6sMudx9JRTrgBGwUHg6Mcb55D
 50 |           Aw5PGCEJ0+KMOjfEcgUktAmt0XAp5ApUw2wegqiUxhbQHv+1l1vax9jaFr+RbwApwRGo3HlQWl7m
 51 |           bdo8xL/yU9t5xLVhHnaBoMyX2hbgndf1sutNHpIvAAAA//8DADNNhHOsAwAA
 52 |       headers:
 53 |         CF-Cache-Status:
 54 |           - DYNAMIC
 55 |         CF-RAY:
 56 |           - 8df9527aaebbcfa8-SJC
 57 |         Connection:
 58 |           - keep-alive
 59 |         Content-Encoding:
 60 |           - gzip
 61 |         Content-Type:
 62 |           - application/json
 63 |         Date:
 64 |           - Fri, 08 Nov 2024 23:25:25 GMT
 65 |         Server:
 66 |           - cloudflare
 67 |         Transfer-Encoding:
 68 |           - chunked
 69 |         X-Content-Type-Options:
 70 |           - nosniff
 71 |         access-control-expose-headers:
 72 |           - X-Request-ID
 73 |         alt-svc:
 74 |           - h3=":443"; ma=86400
 75 |         openai-organization:
 76 |           - future-house-xr4tdh
 77 |         openai-processing-ms:
 78 |           - "188"
 79 |         openai-version:
 80 |           - "2020-10-01"
 81 |         strict-transport-security:
 82 |           - max-age=31536000; includeSubDomains; preload
 83 |         x-ratelimit-limit-requests:
 84 |           - "12000"
 85 |         x-ratelimit-limit-tokens:
 86 |           - "1000000"
 87 |         x-ratelimit-remaining-requests:
 88 |           - "11999"
 89 |         x-ratelimit-remaining-tokens:
 90 |           - "999953"
 91 |         x-ratelimit-reset-requests:
 92 |           - 5ms
 93 |         x-ratelimit-reset-tokens:
 94 |           - 2ms
 95 |         x-request-id:
 96 |           - req_bcb3d0f3b0c9612ae3e97088211a9b9b
 97 |       status:
 98 |         code: 200
 99 |         message: OK
100 | version: 1
101 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestMultipleCompletionLLMModel.test_output_schema[json-mode].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages":[{"role":"system","content":"Respond following this JSON schema:\n\n{\"properties\":
  5 |         {\"name\": {\"title\": \"Name\", \"type\": \"string\"}, \"age\": {\"title\":
  6 |         \"Age\", \"type\": \"integer\"}}, \"required\": [\"name\", \"age\"], \"title\":
  7 |         \"DummyOutputSchema\", \"type\": \"object\"}"},{"role":"user","content":"My
  8 |         name is Claude and I am 1 year old. What is my name and age?"}],"model":"gpt-3.5-turbo","n":2,"response_format":{"type":"json_object"}}'
  9 |       headers:
 10 |         accept:
 11 |           - application/json
 12 |         accept-encoding:
 13 |           - gzip, deflate
 14 |         connection:
 15 |           - keep-alive
 16 |         content-length:
 17 |           - "465"
 18 |         content-type:
 19 |           - application/json
 20 |         host:
 21 |           - api.openai.com
 22 |         user-agent:
 23 |           - AsyncOpenAI/Python 1.55.3
 24 |         x-stainless-arch:
 25 |           - arm64
 26 |         x-stainless-async:
 27 |           - async:asyncio
 28 |         x-stainless-lang:
 29 |           - python
 30 |         x-stainless-os:
 31 |           - MacOS
 32 |         x-stainless-package-version:
 33 |           - 1.55.3
 34 |         x-stainless-raw-response:
 35 |           - "true"
 36 |         x-stainless-retry-count:
 37 |           - "0"
 38 |         x-stainless-runtime:
 39 |           - CPython
 40 |         x-stainless-runtime-version:
 41 |           - 3.12.7
 42 |       method: POST
 43 |       uri: https://api.openai.com/v1/chat/completions
 44 |     response:
 45 |       body:
 46 |         string: !!binary |
 47 |           H4sIAAAAAAAAA7RTwYrbMBS8+yvEOyfL2ma7xLel9NRDW1rKQl2MIr3Y2sp6QnqG7Ib8e5ETxw67
 48 |           hR7aiw8zb8YzetIhEwKMhkqA6iSr3tv1g3z8+P3xc/fu5Ss9Df2nb1+GZ958kPt98RJglRS0fULF
 49 |           k+pGUe8tsiF3olVAyZhc8/uyLO7zYpOPRE8abZK1ntflzd2ah7Cl9W1e3J2VHRmFESrxIxNCiMP4
 50 |           TRmdxj1U4nY1IT3GKFuE6jIkBASyCQEZo4ksHcNqJhU5RjfGPtTgZI81VKKG91YOGmtYiRpkO4L5
 51 |           cSkMuBuiTMHdYO0ZP16SWGp9oG088xd8Z5yJXRNQRnLpr5HJQ7YQv6qX/6t6LkFvlpyoqWnt/nfX
 52 |           TIif43aHq0bgA/WeG6Zf6JLhpjzZwXyfZrI8bx6YWNoZz4tJdWXXaGRpbFycHyipOtSzdL5LctCG
 53 |           FsRyR6/TvOV9Km5c+zf2M6EUekbd+IDaqOvG81jA9Nz+NHY55DEwxOfI2Dc741oMPpjxRoy7PGa/
 54 |           AQAA//8DAL4bR47vAwAA
 55 |       headers:
 56 |         CF-Cache-Status:
 57 |           - DYNAMIC
 58 |         CF-RAY:
 59 |           - 8ec799405a7ecfac-SJC
 60 |         Connection:
 61 |           - keep-alive
 62 |         Content-Encoding:
 63 |           - gzip
 64 |         Content-Type:
 65 |           - application/json
 66 |         Date:
 67 |           - Wed, 04 Dec 2024 00:14:51 GMT
 68 |         Server:
 69 |           - cloudflare
 70 |         Set-Cookie:
 71 |           - __cf_bm=br87AQInkCnSV_I9MXX5tYGv6_ZP_82Htl2IQun7srQ-1733271291-1.0.1.1-.r_ewngzuQkAkcKmG5atHV1LISuUrs2yVGfkZp0pxbuZa00Mqp.aWv.QYORcyr6VriqkQoJnjfJY99tvrd7rKw;
 72 |             path=/; expires=Wed, 04-Dec-24 00:44:51 GMT; domain=.api.openai.com; HttpOnly;
 73 |             Secure; SameSite=None
 74 |           - _cfuvid=_yXi1Uk8mQKkHMlntTwGtMye1ID9VJRq.3psfLHacuU-1733271291921-0.0.1.1-604800000;
 75 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 76 |         Transfer-Encoding:
 77 |           - chunked
 78 |         X-Content-Type-Options:
 79 |           - nosniff
 80 |         access-control-expose-headers:
 81 |           - X-Request-ID
 82 |         alt-svc:
 83 |           - h3=":443"; ma=86400
 84 |         openai-organization:
 85 |           - future-house-xr4tdh
 86 |         openai-processing-ms:
 87 |           - "268"
 88 |         openai-version:
 89 |           - "2020-10-01"
 90 |         strict-transport-security:
 91 |           - max-age=31536000; includeSubDomains; preload
 92 |         x-ratelimit-limit-requests:
 93 |           - "12000"
 94 |         x-ratelimit-limit-tokens:
 95 |           - "1000000"
 96 |         x-ratelimit-remaining-requests:
 97 |           - "11999"
 98 |         x-ratelimit-remaining-tokens:
 99 |           - "999894"
100 |         x-ratelimit-reset-requests:
101 |           - 5ms
102 |         x-ratelimit-reset-tokens:
103 |           - 6ms
104 |         x-request-id:
105 |           - req_2d64ba6207682b9086d527ac85f85959
106 |       status:
107 |         code: 200
108 |         message: OK
109 | version: 1
110 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestMultipleCompletionLLMModel.test_output_schema[structured-outputs].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages":[{"role":"user","content":"My name is Claude and I am 1 year
  5 |         old. What is my name and age?"}],"model":"gpt-4o","n":2,"response_format":{"type":"json_schema","json_schema":{"strict":true,"schema":{"properties":{"name":{"title":"Name","type":"string"},"age":{"title":"Age","type":"integer"}},"required":["name","age"],"title":"DummyOutputSchema","type":"object","additionalProperties":false},"name":"DummyOutputSchema"}}}'
  6 |       headers:
  7 |         accept:
  8 |           - application/json
  9 |         accept-encoding:
 10 |           - gzip, deflate
 11 |         connection:
 12 |           - keep-alive
 13 |         content-length:
 14 |           - "431"
 15 |         content-type:
 16 |           - application/json
 17 |         host:
 18 |           - api.openai.com
 19 |         user-agent:
 20 |           - AsyncOpenAI/Python 1.55.3
 21 |         x-stainless-arch:
 22 |           - arm64
 23 |         x-stainless-async:
 24 |           - async:asyncio
 25 |         x-stainless-lang:
 26 |           - python
 27 |         x-stainless-os:
 28 |           - MacOS
 29 |         x-stainless-package-version:
 30 |           - 1.55.3
 31 |         x-stainless-raw-response:
 32 |           - "true"
 33 |         x-stainless-retry-count:
 34 |           - "0"
 35 |         x-stainless-runtime:
 36 |           - CPython
 37 |         x-stainless-runtime-version:
 38 |           - 3.12.7
 39 |       method: POST
 40 |       uri: https://api.openai.com/v1/chat/completions
 41 |     response:
 42 |       body:
 43 |         string: !!binary |
 44 |           H4sIAAAAAAAAA9xTTW+cMBS88yusd4YK2CgQbv26VZWiHpqoVOit/Zb1rrEt20iNVvvfK7NkIUoi
 45 |           9dwLh5k3w4z9fEoYAymgYcD3GPhgVfYRH34+Fsd79+U7Hp5+0P2nb1usvx6OD/SoIY0Ksz0QD8+q
 46 |           D9wMVlGQZqa5IwwUXYtqsymrMt/UEzEYQSrKehuyG5OVeXmT5XWW387CvZGcPDTsV8IYY6fpGyNq
 47 |           QX+gYXn6jAzkPfYEzXWIMXBGRQTQe+kD6gDpQnKjA+kp9akFjQO10LTwWeEoqIW0BewjVJzXKke7
 48 |           0WMMrUelZvx8jaFMb53Z+pm/4juppd93jtAbHX/pg7GQrMSvuhX/Q7eEsd/TVY4vGoB1ZrChC+ZI
 49 |           OhpWdxc7WHZnIYt6JoMJqBb8rkrfcOsEBZTKr44LOPI9iUW57A2OQpoVsb6S12He8r70lrr/F/uF
 50 |           4JxsINFZR0Lyl4WXMUfxZb03dj3jKTD4Jx9o6HZS9+Ssk5cF2Nmu3hSU31aiLiE5J38BAAD//wMA
 51 |           vVnbbuUDAAA=
 52 |       headers:
 53 |         CF-Cache-Status:
 54 |           - DYNAMIC
 55 |         CF-RAY:
 56 |           - 8ec7ab7fe966aaa5-SJC
 57 |         Connection:
 58 |           - keep-alive
 59 |         Content-Encoding:
 60 |           - gzip
 61 |         Content-Type:
 62 |           - application/json
 63 |         Date:
 64 |           - Wed, 04 Dec 2024 00:27:19 GMT
 65 |         Server:
 66 |           - cloudflare
 67 |         Set-Cookie:
 68 |           - __cf_bm=5AuGimsg2FH0ntBI.jKIdG9P._9c78WMhN9jaiVQGeM-1733272039-1.0.1.1-F92PupP7R_e1Usesjv3KlZUrgLh73lB5LXJjilxG5ZwkFDrI1tOZsZp0zhC5gY.WjprQpIckFtJxWsiUNww0kw;
 69 |             path=/; expires=Wed, 04-Dec-24 00:57:19 GMT; domain=.api.openai.com; HttpOnly;
 70 |             Secure; SameSite=None
 71 |           - _cfuvid=.1wBj_f8n7gG1Go8qdTIwKV7Pk8XaH9yfTumfoAGccU-1733272039104-0.0.1.1-604800000;
 72 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 73 |         Transfer-Encoding:
 74 |           - chunked
 75 |         X-Content-Type-Options:
 76 |           - nosniff
 77 |         access-control-expose-headers:
 78 |           - X-Request-ID
 79 |         alt-svc:
 80 |           - h3=":443"; ma=86400
 81 |         openai-organization:
 82 |           - future-house-xr4tdh
 83 |         openai-processing-ms:
 84 |           - "610"
 85 |         openai-version:
 86 |           - "2020-10-01"
 87 |         strict-transport-security:
 88 |           - max-age=31536000; includeSubDomains; preload
 89 |         x-ratelimit-limit-requests:
 90 |           - "10000"
 91 |         x-ratelimit-limit-tokens:
 92 |           - "30000000"
 93 |         x-ratelimit-remaining-requests:
 94 |           - "9999"
 95 |         x-ratelimit-remaining-tokens:
 96 |           - "29999951"
 97 |         x-ratelimit-reset-requests:
 98 |           - 6ms
 99 |         x-ratelimit-reset-tokens:
100 |           - 0s
101 |         x-request-id:
102 |           - req_86d20ee0ac20474675168c7b0c693f02
103 |       status:
104 |         code: 200
105 |         message: OK
106 | version: 1
107 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestMultipleCompletionLLMModel.test_text_image_message[gpt-4o-mini-2024-07-18].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "user", "content": [{"type": "image_url", "image_url":
  5 |         {"url": "data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAACAAAAAgCAIAAAD8GO2jAAAAKElEQVR4nO3NMQEAAAjDMMC/ZzDBvlRA01vZJvwHAAAAAAAAAAAAbx2jxAE/i2AjOgAAAABJRU5ErkJggg=="}},
  6 |         {"type": "text", "text": "What color is this square? Respond only with the color
  7 |         name."}]}], "model": "gpt-4o-mini-2024-07-18", "n": 2}'
  8 |       headers:
  9 |         accept:
 10 |           - application/json
 11 |         accept-encoding:
 12 |           - gzip, deflate
 13 |         connection:
 14 |           - keep-alive
 15 |         content-length:
 16 |           - "381"
 17 |         content-type:
 18 |           - application/json
 19 |         host:
 20 |           - api.openai.com
 21 |         user-agent:
 22 |           - AsyncOpenAI/Python 1.54.3
 23 |         x-stainless-arch:
 24 |           - arm64
 25 |         x-stainless-async:
 26 |           - async:asyncio
 27 |         x-stainless-lang:
 28 |           - python
 29 |         x-stainless-os:
 30 |           - MacOS
 31 |         x-stainless-package-version:
 32 |           - 1.54.3
 33 |         x-stainless-raw-response:
 34 |           - "true"
 35 |         x-stainless-retry-count:
 36 |           - "1"
 37 |         x-stainless-runtime:
 38 |           - CPython
 39 |         x-stainless-runtime-version:
 40 |           - 3.12.7
 41 |       method: POST
 42 |       uri: https://api.openai.com/v1/chat/completions
 43 |     response:
 44 |       body:
 45 |         string: !!binary |
 46 |           H4sIAAAAAAAAA9STP0/DMBDF93wKy3ODmtA/IRszWxkQQihy7GticHyWz5WKqn535DRtUhUkVpYM
 47 |           97v38nxnHxLGuFa8ZFy2IsjOmfRx86xyp572+FL715pq7ZCKtqOVssRnUYH1B8hwVt1J7JyBoNGe
 48 |           sPQgAkTXbH2fZfMiXxU96FCBibLGhXSBaaetTvN5vkjn6zQrBnWLWgLxkr0ljDF26L8xp1Ww5yWb
 49 |           z86VDohEA7y8NDHGPZpY4YJIUxA28NkIJdoAto++ATUlHrY7EjGd3Rkz1I+XXxlsnMeaBn6pb7XV
 50 |           1FYeBKGNthTQ8WQivsmf/Zf8CWPv/Up2Vym589i5UAX8BBsNi2U+7ISPV2HE+cACBmGuVGdyZVgp
 51 |           CEIbmkyFSyFbUKN2vAJipzROwHTyt2l+8j4dXdvmL/YjkBJcAFU5D0rL6xOPbR7iS/mt7TLmPjCn
 52 |           LwrQVVttG/DO69Oet656qNdFvcrkMufJMfkGAAD//wMAhyjYPLUDAAA=
 53 |       headers:
 54 |         CF-Cache-Status:
 55 |           - DYNAMIC
 56 |         CF-RAY:
 57 |           - 8df9510e7fa3172e-SJC
 58 |         Connection:
 59 |           - keep-alive
 60 |         Content-Encoding:
 61 |           - gzip
 62 |         Content-Type:
 63 |           - application/json
 64 |         Date:
 65 |           - Fri, 08 Nov 2024 23:24:29 GMT
 66 |         Server:
 67 |           - cloudflare
 68 |         Transfer-Encoding:
 69 |           - chunked
 70 |         X-Content-Type-Options:
 71 |           - nosniff
 72 |         access-control-expose-headers:
 73 |           - X-Request-ID
 74 |         alt-svc:
 75 |           - h3=":443"; ma=86400
 76 |         openai-organization:
 77 |           - future-house-xr4tdh
 78 |         openai-processing-ms:
 79 |           - "1964"
 80 |         openai-version:
 81 |           - "2020-10-01"
 82 |         strict-transport-security:
 83 |           - max-age=31536000; includeSubDomains; preload
 84 |         x-ratelimit-limit-input-images:
 85 |           - "50000"
 86 |         x-ratelimit-limit-requests:
 87 |           - "30000"
 88 |         x-ratelimit-limit-tokens:
 89 |           - "150000000"
 90 |         x-ratelimit-remaining-input-images:
 91 |           - "49999"
 92 |         x-ratelimit-remaining-requests:
 93 |           - "29999"
 94 |         x-ratelimit-remaining-tokens:
 95 |           - "149999187"
 96 |         x-ratelimit-reset-input-images:
 97 |           - 1ms
 98 |         x-ratelimit-reset-requests:
 99 |           - 2ms
100 |         x-ratelimit-reset-tokens:
101 |           - 0s
102 |         x-request-id:
103 |           - req_7823d27f0ca9fc3fefbc0261333d26e3
104 |       status:
105 |         code: 200
106 |         message: OK
107 | version: 1
108 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestNoToolsSimpleAgent.test_dummyenv[claude-3-5-haiku-20241022].yaml:
--------------------------------------------------------------------------------
 1 | interactions:
 2 |   - request:
 3 |       body:
 4 |         '{"model": "claude-3-5-haiku-20241022", "messages": [{"role": "user", "content":
 5 |         [{"type": "text", "text": "Write a 5 word story via print_story"}]}], "temperature":
 6 |         0.1, "max_tokens": 4096}'
 7 |       headers:
 8 |         accept:
 9 |           - application/json
10 |         accept-encoding:
11 |           - gzip, deflate
12 |         anthropic-version:
13 |           - "2023-06-01"
14 |         connection:
15 |           - keep-alive
16 |         content-length:
17 |           - "189"
18 |         content-type:
19 |           - application/json
20 |         host:
21 |           - api.anthropic.com
22 |         user-agent:
23 |           - litellm/1.59.5
24 |       method: POST
25 |       uri: https://api.anthropic.com/v1/messages
26 |     response:
27 |       body:
28 |         string: !!binary |
29 |           H4sIAAAAAAAAAwAAAP//ZJAxb9wwDIX/CsGlCeAL7twc0GprpgwZMnRqXdiqRNtqHNIRqbTG4f57
30 |           YTcBEnQi8N6nx0edMEV0+KhDuz/cfAv3862PdT/yz+V64frL/U3CCm2ZaaVI1Q+EFWaZVsGrJjXP
31 |           hhU+SqQJHYbJl0i7j7vjbvTpoezqfX192Nc1VhiEjdjQfT+9Zhr9WV9vw+EtZfqg4OG4+y05gprk
32 |           BYomHsBGgm7Oia3d5A76wsGSsGu44a7r5sVG4YYj9fAGvLh0DQPAP+2iwTtRg0meCXopHMEPPjGY
33 |           RL9cNXi5Za2RX8ekEIRDUnqpomUYSG2tyD5nb+mZQHrIFISZtjrgOcIoM0Fi+FXUoF+p9SC9wvOP
34 |           CtVkbjN5FUaHxLG1khlfDKWnQhwIHZdpqrBsn+5OmHgu1po8ECu6w6cKgw8jtSGTXxe374H9q5/J
35 |           x/89KfZWOX4+n/8CAAD//wMA4xURPQ4CAAA=
36 |       headers:
37 |         CF-RAY:
38 |           - 9093f64fdef02302-SJC
39 |         Connection:
40 |           - keep-alive
41 |         Content-Encoding:
42 |           - gzip
43 |         Content-Type:
44 |           - application/json
45 |         Date:
46 |           - Tue, 28 Jan 2025 21:09:13 GMT
47 |         Server:
48 |           - cloudflare
49 |         Transfer-Encoding:
50 |           - chunked
51 |         X-Robots-Tag:
52 |           - none
53 |         anthropic-ratelimit-input-tokens-limit:
54 |           - "5000000"
55 |         anthropic-ratelimit-input-tokens-remaining:
56 |           - "5000000"
57 |         anthropic-ratelimit-input-tokens-reset:
58 |           - "2025-01-28T21:09:12Z"
59 |         anthropic-ratelimit-output-tokens-limit:
60 |           - "1000000"
61 |         anthropic-ratelimit-output-tokens-remaining:
62 |           - "1000000"
63 |         anthropic-ratelimit-output-tokens-reset:
64 |           - "2025-01-28T21:09:13Z"
65 |         anthropic-ratelimit-requests-limit:
66 |           - "5000"
67 |         anthropic-ratelimit-requests-remaining:
68 |           - "4999"
69 |         anthropic-ratelimit-requests-reset:
70 |           - "2025-01-28T21:09:12Z"
71 |         anthropic-ratelimit-tokens-limit:
72 |           - "6000000"
73 |         anthropic-ratelimit-tokens-remaining:
74 |           - "6000000"
75 |         anthropic-ratelimit-tokens-reset:
76 |           - "2025-01-28T21:09:12Z"
77 |         cf-cache-status:
78 |           - DYNAMIC
79 |         request-id:
80 |           - req_015KajCSj3bs81Latrp75Lv6
81 |         via:
82 |           - 1.1 google
83 |       status:
84 |         code: 200
85 |         message: OK
86 | version: 1
87 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestNoToolsSimpleAgent.test_dummyenv[claude-3-haiku-20240307].yaml:
--------------------------------------------------------------------------------
 1 | interactions:
 2 |   - request:
 3 |       body:
 4 |         '{"model": "claude-3-haiku-20240307", "messages": [{"role": "user", "content":
 5 |         [{"type": "text", "text": "Write a 5 word story via print_story"}]}], "temperature":
 6 |         0.1, "max_tokens": 4096}'
 7 |       headers:
 8 |         accept:
 9 |           - application/json
10 |         accept-encoding:
11 |           - gzip, deflate
12 |         anthropic-version:
13 |           - "2023-06-01"
14 |         connection:
15 |           - keep-alive
16 |         content-length:
17 |           - "187"
18 |         content-type:
19 |           - application/json
20 |         host:
21 |           - api.anthropic.com
22 |         user-agent:
23 |           - litellm/1.57.0
24 |       method: POST
25 |       uri: https://api.anthropic.com/v1/messages
26 |     response:
27 |       body:
28 |         string: !!binary |
29 |           H4sIAAAAAAAAA2SPT0sDMRDFv0qYk0Iq238oObZFevIg6kFXQtxMt2mzkzUzoS2l311aFBRPj3m/
30 |           Nw/eEYIHAx23thrOeLZ9bR+e+vki7Cbzx+XLYnq/AQ1y6PGcQmbXImjIKZ4NxxxYHAlo6JLHCAaa
31 |           6IrHwXiwdmFbBqNqNKnG1S1oaBIJkoB5O/40Cu7PvxcxsMSMKrByaqp2KXvFkvLB1FRTnwOJvdxX
32 |           NTwT7ntsBL3apJIJD1oVWqXcooj7iKg67FIOyFrFsMKYqFWrHJA8r0N/U8M1nN41sKTeZnScCAwg
33 |           eSslE3wDxs+C1CAYKjFqKJfx5giB+iJW0haJwQzvNDSuWaNtMjoJiezfQPXDMzr/n6Uiv53x8HT6
34 |           AgAA//8DADKg2IOWAQAA
35 |       headers:
36 |         CF-Cache-Status:
37 |           - DYNAMIC
38 |         CF-RAY:
39 |           - 905a90659e5cf9d4-SJC
40 |         Connection:
41 |           - keep-alive
42 |         Content-Encoding:
43 |           - gzip
44 |         Content-Type:
45 |           - application/json
46 |         Date:
47 |           - Tue, 21 Jan 2025 21:58:10 GMT
48 |         Server:
49 |           - cloudflare
50 |         Transfer-Encoding:
51 |           - chunked
52 |         X-Robots-Tag:
53 |           - none
54 |         anthropic-ratelimit-input-tokens-limit:
55 |           - "5000000"
56 |         anthropic-ratelimit-input-tokens-remaining:
57 |           - "5000000"
58 |         anthropic-ratelimit-input-tokens-reset:
59 |           - "2025-01-21T21:58:09Z"
60 |         anthropic-ratelimit-output-tokens-limit:
61 |           - "1000000"
62 |         anthropic-ratelimit-output-tokens-remaining:
63 |           - "1000000"
64 |         anthropic-ratelimit-output-tokens-reset:
65 |           - "2025-01-21T21:58:09Z"
66 |         anthropic-ratelimit-requests-limit:
67 |           - "5000"
68 |         anthropic-ratelimit-requests-remaining:
69 |           - "4999"
70 |         anthropic-ratelimit-requests-reset:
71 |           - "2025-01-21T21:58:09Z"
72 |         anthropic-ratelimit-tokens-limit:
73 |           - "6000000"
74 |         anthropic-ratelimit-tokens-remaining:
75 |           - "6000000"
76 |         anthropic-ratelimit-tokens-reset:
77 |           - "2025-01-21T21:58:09Z"
78 |         request-id:
79 |           - req_01WUTufxQjbhVVuJMS56CsLC
80 |         via:
81 |           - 1.1 google
82 |       status:
83 |         code: 200
84 |         message: OK
85 | version: 1
86 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestNoToolsSimpleAgent.test_dummyenv[gpt-4o-mini-2024-07-18].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "user", "content": "Write a 5 word story via print_story"}],
  5 |         "model": "gpt-4o-mini-2024-07-18", "n": 1, "temperature": 0.1}'
  6 |       headers:
  7 |         accept:
  8 |           - application/json
  9 |         accept-encoding:
 10 |           - gzip, deflate
 11 |         connection:
 12 |           - keep-alive
 13 |         content-length:
 14 |           - "146"
 15 |         content-type:
 16 |           - application/json
 17 |         host:
 18 |           - api.openai.com
 19 |         user-agent:
 20 |           - AsyncOpenAI/Python 1.59.3
 21 |         x-stainless-arch:
 22 |           - arm64
 23 |         x-stainless-async:
 24 |           - async:asyncio
 25 |         x-stainless-lang:
 26 |           - python
 27 |         x-stainless-os:
 28 |           - MacOS
 29 |         x-stainless-package-version:
 30 |           - 1.59.3
 31 |         x-stainless-raw-response:
 32 |           - "true"
 33 |         x-stainless-retry-count:
 34 |           - "0"
 35 |         x-stainless-runtime:
 36 |           - CPython
 37 |         x-stainless-runtime-version:
 38 |           - 3.12.7
 39 |       method: POST
 40 |       uri: https://api.openai.com/v1/chat/completions
 41 |     response:
 42 |       body:
 43 |         string: !!binary |
 44 |           H4sIAAAAAAAAAwAAAP//jFJNT+MwEL3nV1g+J6gNpYHedi+LgOsuWhCKXHuSenE8lmfCh1D/+8pJ
 45 |           2xQBEpcc3pv38t543jIhpDVyJaTeKNZdcMUP+vX3/C68PBt1dnd57dwfvo1XvzH8bCnIPClw/Q80
 46 |           71UnGrvggC36kdYRFENynVen1eJiubwoB6JDAy7J2sDFAovOeluUs3JRzKpifr5Tb9BqILkS95kQ
 47 |           QrwN35TTG3iRKzHL90gHRKoFuToMCSEjuoRIRWSJlWeZT6RGz+CH6DdILB7hNRcGMYoGIzxBFNoh
 48 |           gTk5FkVoelIpuO+d2+HbQwqHbYi4ph1/wBvrLW3qCIrQpz8SY5ADu82EeBja9u8KyBCxC1wzPoJP
 49 |           hvPlaCenHU9kteMYWbkJLk/zT8xqA6yso6NlSa30BsyknDaremPxiMiOKn/M8pn3WNv69jv2E6E1
 50 |           BAZThwjG6vd9p7EI6QC/GjuseAgsCeKT1VCzhZiewUCjejeehaRXYujqxvoWYoh2vI0m1FUJplLr
 51 |           s4WW2Tb7DwAA//8DALVhDRgpAwAA
 52 |       headers:
 53 |         CF-Cache-Status:
 54 |           - DYNAMIC
 55 |         CF-RAY:
 56 |           - 905a9069eaafebe9-SJC
 57 |         Connection:
 58 |           - keep-alive
 59 |         Content-Encoding:
 60 |           - gzip
 61 |         Content-Type:
 62 |           - application/json
 63 |         Date:
 64 |           - Tue, 21 Jan 2025 21:58:12 GMT
 65 |         Server:
 66 |           - cloudflare
 67 |         Set-Cookie:
 68 |           - __cf_bm=2dYW.ZjJiarII_MAmJyoaMr3FRfPWBOFDGojtrktaCY-1737496692-1.0.1.1-XP4CYYKfgXRJujlYOUGIPtWWH6aJ0jLgiPgiYT46.vTw0mR_5bWClcm4Hw_M9oTWb8KKJVyoyLfto3RLRGJMug;
 69 |             path=/; expires=Tue, 21-Jan-25 22:28:12 GMT; domain=.api.openai.com; HttpOnly;
 70 |             Secure; SameSite=None
 71 |           - _cfuvid=cKqI45QiSqB042Gew1XZbNwSC3TvNkhGer1N8m9zLbc-1737496692594-0.0.1.1-604800000;
 72 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 73 |         Transfer-Encoding:
 74 |           - chunked
 75 |         X-Content-Type-Options:
 76 |           - nosniff
 77 |         access-control-expose-headers:
 78 |           - X-Request-ID
 79 |         alt-svc:
 80 |           - h3=":443"; ma=86400
 81 |         openai-organization:
 82 |           - future-house-xr4tdh
 83 |         openai-processing-ms:
 84 |           - "940"
 85 |         openai-version:
 86 |           - "2020-10-01"
 87 |         strict-transport-security:
 88 |           - max-age=31536000; includeSubDomains; preload
 89 |         x-ratelimit-limit-requests:
 90 |           - "30000"
 91 |         x-ratelimit-limit-tokens:
 92 |           - "150000000"
 93 |         x-ratelimit-remaining-requests:
 94 |           - "29999"
 95 |         x-ratelimit-remaining-tokens:
 96 |           - "149999973"
 97 |         x-ratelimit-reset-requests:
 98 |           - 2ms
 99 |         x-ratelimit-reset-tokens:
100 |           - 0s
101 |         x-request-id:
102 |           - req_19dbe433a04699f46315a7af746c0386
103 |       status:
104 |         code: 200
105 |         message: OK
106 | version: 1
107 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestSimpleAgent.test_agent_grad[claude-3-5-haiku-20241022].yaml:
--------------------------------------------------------------------------------
 1 | interactions:
 2 |   - request:
 3 |       body:
 4 |         '{"model": "claude-3-5-haiku-20241022", "messages": [{"role": "user", "content":
 5 |         [{"type": "text", "text": "Write a 5 word story via print_story"}]}], "temperature":
 6 |         0.1, "max_tokens": 4096, "tools": [{"name": "print_story", "input_schema": {"type":
 7 |         "object", "properties": {"story": {"description": "Story to print.", "title":
 8 |         "Story", "type": "string"}}, "required": ["story"]}, "description": "Print a
 9 |         story."}, {"name": "cast_float", "input_schema": {"type": "object", "properties":
10 |         {"x": {"title": "X", "type": "string"}}, "required": ["x"]}, "description":
11 |         "Cast the input argument x to a float."}, {"name": "cast_int", "input_schema":
12 |         {"type": "object", "properties": {"x": {"title": "X", "type": "number"}}, "required":
13 |         ["x"]}, "description": "Cast the input argument x to an integer."}], "tool_choice":
14 |         {"type": "any"}}'
15 |       headers:
16 |         accept:
17 |           - application/json
18 |         accept-encoding:
19 |           - gzip, deflate
20 |         anthropic-version:
21 |           - "2023-06-01"
22 |         connection:
23 |           - keep-alive
24 |         content-length:
25 |           - "827"
26 |         content-type:
27 |           - application/json
28 |         host:
29 |           - api.anthropic.com
30 |         user-agent:
31 |           - litellm/1.59.5
32 |       method: POST
33 |       uri: https://api.anthropic.com/v1/messages
34 |     response:
35 |       body:
36 |         string: !!binary |
37 |           H4sIAAAAAAAAA2RPy2rDMBD8FbNnu9jK46BjS2kJOTSFUHApQpG3joisda1Vm2D870UJgYYed147
38 |           M4JtQEIXWlVWC2Fi9bp5PD5Xb5t6tez1Z7UmyIFPPSYVhqBbhBwGcgnQIdjA2jPk0FGDDiQYp2OD
39 |           xaxYFHttD7EQpZhXpRCQgyHP6Bnk+3jNZCKnYkih5ybpjqqsnnY/dc223m5f7vWhFctu9TBLGV53
40 |           ydcP1rMKTMMpWX0fGeQIF0DCmr4x2zmiDpvM+ix6PPZoGJssWIfe4B1M00eeDL0aUAfyt23ORMCv
41 |           mMQgfXQuh3jeL8fLQ8V0QB9ALpYiB6PNHpUZULMlr24V5ZUfUDf/OYr8F5nPpukXAAD//wMANKfE
42 |           mZoBAAA=
43 |       headers:
44 |         CF-RAY:
45 |           - 9093f64eef9f7e2d-SJC
46 |         Connection:
47 |           - keep-alive
48 |         Content-Encoding:
49 |           - gzip
50 |         Content-Type:
51 |           - application/json
52 |         Date:
53 |           - Tue, 28 Jan 2025 21:09:14 GMT
54 |         Server:
55 |           - cloudflare
56 |         Transfer-Encoding:
57 |           - chunked
58 |         X-Robots-Tag:
59 |           - none
60 |         anthropic-ratelimit-input-tokens-limit:
61 |           - "5000000"
62 |         anthropic-ratelimit-input-tokens-remaining:
63 |           - "5000000"
64 |         anthropic-ratelimit-input-tokens-reset:
65 |           - "2025-01-28T21:09:13Z"
66 |         anthropic-ratelimit-output-tokens-limit:
67 |           - "1000000"
68 |         anthropic-ratelimit-output-tokens-remaining:
69 |           - "1000000"
70 |         anthropic-ratelimit-output-tokens-reset:
71 |           - "2025-01-28T21:09:14Z"
72 |         anthropic-ratelimit-requests-limit:
73 |           - "5000"
74 |         anthropic-ratelimit-requests-remaining:
75 |           - "4997"
76 |         anthropic-ratelimit-requests-reset:
77 |           - "2025-01-28T21:09:12Z"
78 |         anthropic-ratelimit-tokens-limit:
79 |           - "6000000"
80 |         anthropic-ratelimit-tokens-remaining:
81 |           - "6000000"
82 |         anthropic-ratelimit-tokens-reset:
83 |           - "2025-01-28T21:09:13Z"
84 |         cf-cache-status:
85 |           - DYNAMIC
86 |         request-id:
87 |           - req_01ACKBwLEvWvcDqXyBCXrFBj
88 |         via:
89 |           - 1.1 google
90 |       status:
91 |         code: 200
92 |         message: OK
93 | version: 1
94 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestSimpleAgent.test_agent_grad[claude-3-haiku-20240307].yaml:
--------------------------------------------------------------------------------
 1 | interactions:
 2 |   - request:
 3 |       body:
 4 |         '{"messages": [{"role": "user", "content": [{"type": "text", "text": "Write
 5 |         a 5 word story via print_story"}]}], "temperature": 0.1, "tools": [{"name":
 6 |         "print_story", "input_schema": {"type": "object", "properties": {"story": {"description":
 7 |         "Story to print.", "title": "Story", "type": "string"}}, "required": ["story"]},
 8 |         "description": "Print a story."}, {"name": "cast_float", "input_schema": {"type":
 9 |         "object", "properties": {"x": {"title": "X", "type": "string"}}, "required":
10 |         ["x"]}, "description": "Cast the input argument x to a float."}, {"name": "cast_int",
11 |         "input_schema": {"type": "object", "properties": {"x": {"title": "X", "type":
12 |         "number"}}, "required": ["x"]}, "description": "Cast the input argument x to
13 |         an integer."}], "tool_choice": {"type": "any"}, "max_tokens": 4096, "model":
14 |         "claude-3-haiku-20240307"}'
15 |       headers:
16 |         accept:
17 |           - application/json
18 |         accept-encoding:
19 |           - gzip, deflate
20 |         anthropic-version:
21 |           - "2023-06-01"
22 |         connection:
23 |           - keep-alive
24 |         content-length:
25 |           - "825"
26 |         content-type:
27 |           - application/json
28 |         host:
29 |           - api.anthropic.com
30 |         user-agent:
31 |           - litellm/1.52.3
32 |       method: POST
33 |       uri: https://api.anthropic.com/v1/messages
34 |     response:
35 |       body:
36 |         string: !!binary |
37 |           H4sIAAAAAAAAA1SQT0vDQBDFv0qY81bSRKvsTaV4qIh/KIoiYUnGNjaZjTsz0Rjy3WVbPPQ4b957
38 |           /Hgj1BVYaHlTpPPn/GG4UL7q85vVS/nUf+d1e9eBARk6jC5kdhsEA8E3UXDMNYsjAQOtr7ABC2Xj
39 |           tMJZPtu6eqezLM1O0zw9BwOlJ0ESsG/jf6N43xTKsXLPEW8t0vlj/UputbxdyC9ur5dc3vfrdg0G
40 |           yLUx14WapGDxYYhR6lTAjnAQLFxWPZJowJAw4o4TCehYA5rko6aKEyX86bAUrJJPr4FwOIFpejex
41 |           oSui2dMx3v7B+KVIJYIlbRoDup/DjgeCQvwOicGeLTIDXuVIm0/THwAAAP//AwAD26uSbQEAAA==
42 |       headers:
43 |         CF-Cache-Status:
44 |           - DYNAMIC
45 |         CF-RAY:
46 |           - 8df952260dedcfed-SJC
47 |         Connection:
48 |           - keep-alive
49 |         Content-Encoding:
50 |           - gzip
51 |         Content-Type:
52 |           - application/json
53 |         Date:
54 |           - Fri, 08 Nov 2024 23:25:13 GMT
55 |         Server:
56 |           - cloudflare
57 |         Transfer-Encoding:
58 |           - chunked
59 |         X-Robots-Tag:
60 |           - none
61 |         anthropic-ratelimit-requests-limit:
62 |           - "5000"
63 |         anthropic-ratelimit-requests-remaining:
64 |           - "4999"
65 |         anthropic-ratelimit-requests-reset:
66 |           - "2024-11-08T23:26:12Z"
67 |         anthropic-ratelimit-tokens-limit:
68 |           - "5000000"
69 |         anthropic-ratelimit-tokens-remaining:
70 |           - "5000000"
71 |         anthropic-ratelimit-tokens-reset:
72 |           - "2024-11-08T23:25:13Z"
73 |         request-id:
74 |           - req_01NDnvrz2u3MaKcf1cbQULuY
75 |         via:
76 |           - 1.1 google
77 |       status:
78 |         code: 200
79 |         message: OK
80 | version: 1
81 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestSimpleAgent.test_dummyenv[claude-3-5-haiku-20241022].yaml:
--------------------------------------------------------------------------------
 1 | interactions:
 2 |   - request:
 3 |       body:
 4 |         '{"model": "claude-3-5-haiku-20241022", "messages": [{"role": "user", "content":
 5 |         [{"type": "text", "text": "Write a 5 word story via print_story"}]}], "temperature":
 6 |         0.1, "max_tokens": 4096, "tools": [{"name": "print_story", "input_schema": {"type":
 7 |         "object", "properties": {"story": {"description": "Story to print.", "title":
 8 |         "Story", "type": "string"}}, "required": ["story"]}, "description": "Print a
 9 |         story."}, {"name": "cast_float", "input_schema": {"type": "object", "properties":
10 |         {"x": {"title": "X", "type": "string"}}, "required": ["x"]}, "description":
11 |         "Cast the input argument x to a float."}, {"name": "cast_int", "input_schema":
12 |         {"type": "object", "properties": {"x": {"title": "X", "type": "number"}}, "required":
13 |         ["x"]}, "description": "Cast the input argument x to an integer."}], "tool_choice":
14 |         {"type": "any"}}'
15 |       headers:
16 |         accept:
17 |           - application/json
18 |         accept-encoding:
19 |           - gzip, deflate
20 |         anthropic-version:
21 |           - "2023-06-01"
22 |         connection:
23 |           - keep-alive
24 |         content-length:
25 |           - "827"
26 |         content-type:
27 |           - application/json
28 |         host:
29 |           - api.anthropic.com
30 |         user-agent:
31 |           - litellm/1.59.5
32 |       method: POST
33 |       uri: https://api.anthropic.com/v1/messages
34 |     response:
35 |       body:
36 |         string: !!binary |
37 |           H4sIAAAAAAAAA2RPTWvCQBD9K2HOmxJjUmVvaqEXBW+FlrKsu4NGN7PJftjakP9eVhEqPc77mvcG
38 |           aDRwaP1eFJPVbPn2szi/XnZ6tXwJbrOpFvsNMAiXDpMKvZd7BAbOmgRI7xsfJAVg0FqNBjgoI6PG
39 |           fJrX+UE2p5iXRVlNirIEBspSQArAP4Z7ZrDWiOhT6LVJuqMoJvO6n/bv2yPSYa5mW9lX66/aAgOS
40 |           bfJ1rqEgfLDukqzUxQB8gBvAYW3PmO2MtS3qrKEsEn53qALqzDcGSeETjOMnS4ZOOJTe0mObK+Gx
41 |           j0kMnKIxDOJ1Px9uD0WwJyQPvH4uGSipDiiUQxkaS+JRUdx5h1L/52wMf5FqOo6/AAAA//8DAEbz
42 |           44eaAQAA
43 |       headers:
44 |         CF-Cache-Status:
45 |           - DYNAMIC
46 |         CF-RAY:
47 |           - 9093f64eed7ffa3e-SJC
48 |         Connection:
49 |           - keep-alive
50 |         Content-Encoding:
51 |           - gzip
52 |         Content-Type:
53 |           - application/json
54 |         Date:
55 |           - Tue, 28 Jan 2025 21:09:13 GMT
56 |         Server:
57 |           - cloudflare
58 |         Transfer-Encoding:
59 |           - chunked
60 |         X-Robots-Tag:
61 |           - none
62 |         anthropic-ratelimit-input-tokens-limit:
63 |           - "5000000"
64 |         anthropic-ratelimit-input-tokens-remaining:
65 |           - "5000000"
66 |         anthropic-ratelimit-input-tokens-reset:
67 |           - "2025-01-28T21:09:13Z"
68 |         anthropic-ratelimit-output-tokens-limit:
69 |           - "1000000"
70 |         anthropic-ratelimit-output-tokens-remaining:
71 |           - "1000000"
72 |         anthropic-ratelimit-output-tokens-reset:
73 |           - "2025-01-28T21:09:13Z"
74 |         anthropic-ratelimit-requests-limit:
75 |           - "5000"
76 |         anthropic-ratelimit-requests-remaining:
77 |           - "4998"
78 |         anthropic-ratelimit-requests-reset:
79 |           - "2025-01-28T21:09:12Z"
80 |         anthropic-ratelimit-tokens-limit:
81 |           - "6000000"
82 |         anthropic-ratelimit-tokens-remaining:
83 |           - "6000000"
84 |         anthropic-ratelimit-tokens-reset:
85 |           - "2025-01-28T21:09:13Z"
86 |         request-id:
87 |           - req_01RDaN9hSeKAcGKfk39icQK8
88 |         via:
89 |           - 1.1 google
90 |       status:
91 |         code: 200
92 |         message: OK
93 | version: 1
94 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestSimpleAgent.test_dummyenv[claude-3-haiku-20240307].yaml:
--------------------------------------------------------------------------------
 1 | interactions:
 2 |   - request:
 3 |       body:
 4 |         '{"messages": [{"role": "user", "content": [{"type": "text", "text": "Write
 5 |         a 5 word story via print_story"}]}], "temperature": 0.1, "tools": [{"name":
 6 |         "print_story", "input_schema": {"type": "object", "properties": {"story": {"description":
 7 |         "Story to print.", "title": "Story", "type": "string"}}, "required": ["story"]},
 8 |         "description": "Print a story."}, {"name": "cast_float", "input_schema": {"type":
 9 |         "object", "properties": {"x": {"title": "X", "type": "string"}}, "required":
10 |         ["x"]}, "description": "Cast the input argument x to a float."}, {"name": "cast_int",
11 |         "input_schema": {"type": "object", "properties": {"x": {"title": "X", "type":
12 |         "number"}}, "required": ["x"]}, "description": "Cast the input argument x to
13 |         an integer."}], "tool_choice": {"type": "any"}, "max_tokens": 4096, "model":
14 |         "claude-3-haiku-20240307"}'
15 |       headers:
16 |         accept:
17 |           - application/json
18 |         accept-encoding:
19 |           - gzip, deflate
20 |         anthropic-version:
21 |           - "2023-06-01"
22 |         connection:
23 |           - keep-alive
24 |         content-length:
25 |           - "825"
26 |         content-type:
27 |           - application/json
28 |         host:
29 |           - api.anthropic.com
30 |         user-agent:
31 |           - litellm/1.52.3
32 |       method: POST
33 |       uri: https://api.anthropic.com/v1/messages
34 |     response:
35 |       body:
36 |         string: !!binary |
37 |           H4sIAAAAAAAAA1SQW2vCQBCF/0qY57XES9u4b7UIUmihlF6klBCyo6aJs3FnRtSQ/15W6YOPc+ac
38 |           w8fpoHJgYcvrPB0ugmwW7275Os3aOpuc5ruv+mMKBuTYYnQhc7FGMBB8E4WCuWIpSMDA1jtswELZ
39 |           FOpwMB5siqrWwSgdTdJxeg8GSk+CJGC/u/9G8b7JlWPlmSPemqfD4dPuU1dvzy+zx3km+9Msmx+y
40 |           JRigYhtzbahIchYfjjFKrQrYDi6ChQe3RxINGBJGrDmRgAVrQJOsKnKcKOGhxVLQJb9eA+HxBvr+
41 |           x8SGNo9mT9d45wfjTpFKBEvaNAb0PIftLgS5+BqJwd7ejQx4lSst7fs/AAAA//8DAAk5Fe5tAQAA
42 |       headers:
43 |         CF-Cache-Status:
44 |           - DYNAMIC
45 |         CF-RAY:
46 |           - 8df950f8e8a49452-SJC
47 |         Connection:
48 |           - keep-alive
49 |         Content-Encoding:
50 |           - gzip
51 |         Content-Type:
52 |           - application/json
53 |         Date:
54 |           - Fri, 08 Nov 2024 23:24:25 GMT
55 |         Server:
56 |           - cloudflare
57 |         Transfer-Encoding:
58 |           - chunked
59 |         X-Robots-Tag:
60 |           - none
61 |         anthropic-ratelimit-requests-limit:
62 |           - "5000"
63 |         anthropic-ratelimit-requests-remaining:
64 |           - "4998"
65 |         anthropic-ratelimit-requests-reset:
66 |           - "2024-11-08T23:25:12Z"
67 |         anthropic-ratelimit-tokens-limit:
68 |           - "5000000"
69 |         anthropic-ratelimit-tokens-remaining:
70 |           - "5000000"
71 |         anthropic-ratelimit-tokens-reset:
72 |           - "2024-11-08T23:24:25Z"
73 |         request-id:
74 |           - req_014oiuUyG6RydFy6cCAKTi8Z
75 |         via:
76 |           - 1.1 google
77 |       status:
78 |         code: 200
79 |         message: OK
80 | version: 1
81 | 


--------------------------------------------------------------------------------
/tests/cassettes/TestSimpleAgent.test_hide_old_env_states.yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "user", "content": ""}], "model": "gpt-4o-2024-08-06",
  5 |         "temperature": 0.1}'
  6 |       headers:
  7 |         accept:
  8 |           - application/json
  9 |         accept-encoding:
 10 |           - gzip, deflate
 11 |         connection:
 12 |           - keep-alive
 13 |         content-length:
 14 |           - "97"
 15 |         content-type:
 16 |           - application/json
 17 |         host:
 18 |           - api.openai.com
 19 |         user-agent:
 20 |           - AsyncOpenAI/Python 1.52.2
 21 |         x-stainless-arch:
 22 |           - x64
 23 |         x-stainless-async:
 24 |           - async:asyncio
 25 |         x-stainless-lang:
 26 |           - python
 27 |         x-stainless-os:
 28 |           - Linux
 29 |         x-stainless-package-version:
 30 |           - 1.52.2
 31 |         x-stainless-raw-response:
 32 |           - "true"
 33 |         x-stainless-retry-count:
 34 |           - "0"
 35 |         x-stainless-runtime:
 36 |           - CPython
 37 |         x-stainless-runtime-version:
 38 |           - 3.11.0rc1
 39 |       method: POST
 40 |       uri: https://api.openai.com/v1/chat/completions
 41 |     response:
 42 |       body:
 43 |         string: !!binary |
 44 |           H4sIAAAAAAAAA4xSwWrcMBC9+yumOq+Ld+PsdvdSQhNIQgkEAjmUYhRpbKuVNUIat92E/fcge3e9
 45 |           oSn0osN7857eG+YlAxBGiw0I1UpWnbf5xT1+/XJ59/ywmi/Kurs4C4+3Uf9qG3OlpZglBT39QMUH
 46 |           1UdFnbfIhtxIq4CSMbnOV2fFel6ul4uB6EijTbLGc15SvigWZV58yovlXtiSURjFBr5lAAAvw5si
 47 |           Oo1/xAaK2QHpMEbZoNgchwBEIJsQIWM0kaVjMZtIRY7RDamv0Vr6ANf0G5R0cAOjALbUA5OW28+n
 48 |           woB1H2XK7Xpr9/jumMRS4wM9xT1/xGvjTGyrgDKSS79GJi8GdpcBfB8a929KCB+o81wx/USXDFej
 49 |           m5g2PHHrPcfE0k7wfDl7x6vSyNLYeLIvoaRqUU/Kabmy14ZOiOyk8d9Z3vMeWxvX/I/9RCiFnlFX
 50 |           PqA26m3faSxgOr9/jR03PAQWcRsZu6o2rsHggxkvoPZVea7q81KjRJHtslcAAAD//wMAhkW/KQoD
 51 |           AAA=
 52 |       headers:
 53 |         CF-Cache-Status:
 54 |           - DYNAMIC
 55 |         CF-RAY:
 56 |           - 8de6e1adf9fbfb40-SJC
 57 |         Connection:
 58 |           - keep-alive
 59 |         Content-Encoding:
 60 |           - gzip
 61 |         Content-Type:
 62 |           - application/json
 63 |         Date:
 64 |           - Wed, 06 Nov 2024 17:42:42 GMT
 65 |         Server:
 66 |           - cloudflare
 67 |         Set-Cookie:
 68 |           - __cf_bm=IV1Bcm.OiOhx5Fueebsi7W6vfkykRRtCudT2Nx2Si.8-1730914962-1.0.1.1-gOxkIRQ2IVoWcd1Zz84mSVVwBHV5.OKb837EPZuheau5Qz5mzTUKUZbirerOuWHYGvTe3mf9h3oXoV6SISWa2Q;
 69 |             path=/; expires=Wed, 06-Nov-24 18:12:42 GMT; domain=.api.openai.com; HttpOnly;
 70 |             Secure; SameSite=None
 71 |           - _cfuvid=Cu15wqjKcy0EqDJ_H8EAhxyN9YVdxEDkGLA6vmynwxo-1730914962519-0.0.1.1-604800000;
 72 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
 73 |         Transfer-Encoding:
 74 |           - chunked
 75 |         X-Content-Type-Options:
 76 |           - nosniff
 77 |         access-control-expose-headers:
 78 |           - X-Request-ID
 79 |         alt-svc:
 80 |           - h3=":443"; ma=86400
 81 |         openai-organization:
 82 |           - future-house-xr4tdh
 83 |         openai-processing-ms:
 84 |           - "350"
 85 |         openai-version:
 86 |           - "2020-10-01"
 87 |         strict-transport-security:
 88 |           - max-age=31536000; includeSubDomains; preload
 89 |         x-ratelimit-limit-requests:
 90 |           - "10000"
 91 |         x-ratelimit-limit-tokens:
 92 |           - "30000000"
 93 |         x-ratelimit-remaining-requests:
 94 |           - "9999"
 95 |         x-ratelimit-remaining-tokens:
 96 |           - "29999983"
 97 |         x-ratelimit-reset-requests:
 98 |           - 6ms
 99 |         x-ratelimit-reset-tokens:
100 |           - 0s
101 |         x-request-id:
102 |           - req_654554dd6c32e59d7f3e4e0ff5dafa77
103 |       status:
104 |         code: 200
105 |         message: OK
106 | version: 1
107 | 


--------------------------------------------------------------------------------
/tests/cassettes/test_fallbacks_working[False].yaml:
--------------------------------------------------------------------------------
 1 | interactions:
 2 |   - request:
 3 |       body:
 4 |         '{"messages":[{"role":"user","content":"Hello!"}],"model":"gpt-4o-mini","n":1,"tool_choice":"required","tools":[{"type":"function","function":{"name":"talk","description":"Say
 5 |         something to me.","parameters":{"type":"object","properties":{"message":{"description":"what
 6 |         you want to say","title":"Message","type":"string"}},"required":["message"]}}}]}'
 7 |       headers:
 8 |         accept:
 9 |           - application/json
10 |         accept-encoding:
11 |           - gzip, deflate
12 |         connection:
13 |           - keep-alive
14 |         content-length:
15 |           - "348"
16 |         content-type:
17 |           - application/json
18 |         host:
19 |           - api.openai.com
20 |         user-agent:
21 |           - AsyncOpenAI/Python 1.65.2
22 |         x-stainless-arch:
23 |           - arm64
24 |         x-stainless-async:
25 |           - async:asyncio
26 |         x-stainless-lang:
27 |           - python
28 |         x-stainless-os:
29 |           - MacOS
30 |         x-stainless-package-version:
31 |           - 1.65.2
32 |         x-stainless-raw-response:
33 |           - "true"
34 |         x-stainless-read-timeout:
35 |           - "60.0"
36 |         x-stainless-retry-count:
37 |           - "0"
38 |         x-stainless-runtime:
39 |           - CPython
40 |         x-stainless-runtime-version:
41 |           - 3.12.4
42 |       method: POST
43 |       uri: https://api.openai.com/v1/chat/completions
44 |     response:
45 |       body:
46 |         string:
47 |           "{\n    \"error\": {\n        \"message\": \"Incorrect API key provided:
48 |           abc123. You can find your API key at https://platform.openai.com/account/api-keys.\",\n
49 |           \       \"type\": \"invalid_request_error\",\n        \"param\": null,\n        \"code\":
50 |           \"invalid_api_key\"\n    }\n}\n"
51 |       headers:
52 |         CF-RAY:
53 |           - 93106ee58a25e9e1-LAX
54 |         Connection:
55 |           - keep-alive
56 |         Content-Length:
57 |           - "256"
58 |         Content-Type:
59 |           - application/json; charset=utf-8
60 |         Date:
61 |           - Wed, 16 Apr 2025 03:00:34 GMT
62 |         Server:
63 |           - cloudflare
64 |         Set-Cookie:
65 |           - __cf_bm=fno7x_jxANnm27vgnNYNxHE09oaBaF..5rUNTsRQ1WI-1744772434-1.0.1.1-rsmcL1TWF3LBc0flL7Kmdpy1VXvWhNk7QMMykdrKSZJ.bnFPZCzILfUcIZc6xZDGKuaUQwHRadfN6xtPvj4gkVo_4mM6lTZZPyrOWWDdmCg;
66 |             path=/; expires=Wed, 16-Apr-25 03:30:34 GMT; domain=.api.openai.com; HttpOnly;
67 |             Secure; SameSite=None
68 |           - _cfuvid=S6PXUFvHj99UvUnTDkwFAy45z3FyWDJESdzHk5S0Hy8-1744772434881-0.0.1.1-604800000;
69 |             path=/; domain=.api.openai.com; HttpOnly; Secure; SameSite=None
70 |         X-Content-Type-Options:
71 |           - nosniff
72 |         alt-svc:
73 |           - h3=":443"; ma=86400
74 |         cf-cache-status:
75 |           - DYNAMIC
76 |         strict-transport-security:
77 |           - max-age=31536000; includeSubDomains; preload
78 |         vary:
79 |           - Origin
80 |         x-request-id:
81 |           - req_aedfefa7d8f530b37b53effeaa97d3a0
82 |       status:
83 |         code: 401
84 |         message: Unauthorized
85 | version: 1
86 | 


--------------------------------------------------------------------------------
/tests/cassettes/test_reflect_module.yaml:
--------------------------------------------------------------------------------
 1 | interactions:
 2 |   - request:
 3 |       body:
 4 |         '{"messages": [{"role": "user", "content": [{"type": "text", "text": "<context>\n  I
 5 |         am happy. How do I feel?\n</context>\n<response>\n  You are sad.\n</response>"}]}],
 6 |         "temperature": 0, "system": [{"type": "text", "text": "Consider a proposed response
 7 |         based on context. Reflect on the response within <thought> tags then conclude
 8 |         with a possibly revised response within <final-response> tags."}], "max_tokens":
 9 |         4096, "model": "claude-3-haiku-20240307"}'
10 |       headers:
11 |         accept:
12 |           - application/json
13 |         accept-encoding:
14 |           - gzip, deflate
15 |         anthropic-version:
16 |           - "2023-06-01"
17 |         connection:
18 |           - keep-alive
19 |         content-length:
20 |           - "452"
21 |         content-type:
22 |           - application/json
23 |         host:
24 |           - api.anthropic.com
25 |         user-agent:
26 |           - litellm/1.52.3
27 |       method: POST
28 |       uri: https://api.anthropic.com/v1/messages
29 |     response:
30 |       body:
31 |         string: !!binary |
32 |           H4sIAAAAAAAAA3RRS2vcQAz+K0Ln2cTZFAJmyaU9lRxaWkJKXJaJR94ZYkuTkSabzbL/vdgk9AE9
33 |           Cb6nhI6YArY46W7bXNzdfN2/2sXNF3+In/np9tun10E+okM7ZJpVpOp3hA6LjDPgVZOaZ0OHkwQa
34 |           scV+9DXQ6nIVfXqsq3Wz/tBcNlfosBc2YsP2/vieaPQye5fR4sai1F20646/R4JCmoWVoMMfUsEX
35 |           AvWhQwhCCiwGk7c+gkWCJfvFIBd5ToGCg31MfQQ1b6Rg0duiy1RUGJJC9DkfzmAu8jkXySV5+6N0
36 |           L3UM8EBgMqcPqUz/jXHw4JUCCC9s4kHK5C0Jwy49E591vDn/fVzHmyGxH1fvZdcdzxcOROPbXrPh
37 |           Hw2efjpUk7wt5FUYWyQOW6uF8Y1QeqrEPWHLdRwd1uVd7RET52pbk0dixfZq7VCq/QU1p9MvAAAA
38 |           //8DAOX3hPEMAgAA
39 |       headers:
40 |         CF-Cache-Status:
41 |           - DYNAMIC
42 |         CF-RAY:
43 |           - 8df9510c597cceb1-SJC
44 |         Connection:
45 |           - keep-alive
46 |         Content-Encoding:
47 |           - gzip
48 |         Content-Type:
49 |           - application/json
50 |         Date:
51 |           - Fri, 08 Nov 2024 23:24:27 GMT
52 |         Server:
53 |           - cloudflare
54 |         Transfer-Encoding:
55 |           - chunked
56 |         X-Robots-Tag:
57 |           - none
58 |         anthropic-ratelimit-requests-limit:
59 |           - "5000"
60 |         anthropic-ratelimit-requests-remaining:
61 |           - "4999"
62 |         anthropic-ratelimit-requests-reset:
63 |           - "2024-11-08T23:25:12Z"
64 |         anthropic-ratelimit-tokens-limit:
65 |           - "5000000"
66 |         anthropic-ratelimit-tokens-remaining:
67 |           - "5000000"
68 |         anthropic-ratelimit-tokens-reset:
69 |           - "2024-11-08T23:24:27Z"
70 |         request-id:
71 |           - req_012qo7D67oQLZLHC1k3jXiiN
72 |         via:
73 |           - 1.1 google
74 |       status:
75 |         code: 200
76 |         message: OK
77 | version: 1
78 | 


--------------------------------------------------------------------------------
/tests/cassettes/test_rollout[False].yaml:
--------------------------------------------------------------------------------
  1 | interactions:
  2 |   - request:
  3 |       body:
  4 |         '{"messages": [{"role": "user", "content": "Hello!"}], "model": "gpt-4o-2024-08-06",
  5 |         "temperature": 0.1, "tool_choice": "required", "tools": [{"type": "function",
  6 |         "function": {"name": "talk", "description": "Say something to me.", "parameters":
  7 |         {"type": "object", "properties": {"message": {"description": "what you want
  8 |         to say", "title": "Message", "type": "string"}}, "required": ["message"]}}}]}'
  9 |       headers:
 10 |         accept:
 11 |           - application/json
 12 |         accept-encoding:
 13 |           - gzip, deflate
 14 |         connection:
 15 |           - keep-alive
 16 |         content-length:
 17 |           - "397"
 18 |         content-type:
 19 |           - application/json
 20 |         host:
 21 |           - api.openai.com
 22 |         user-agent:
 23 |           - AsyncOpenAI/Python 1.54.3
 24 |         x-stainless-arch:
 25 |           - arm64
 26 |         x-stainless-async:
 27 |           - async:asyncio
 28 |         x-stainless-lang:
 29 |           - python
 30 |         x-stainless-os:
 31 |           - MacOS
 32 |         x-stainless-package-version:
 33 |           - 1.54.3
 34 |         x-stainless-raw-response:
 35 |           - "true"
 36 |         x-stainless-retry-count:
 37 |           - "1"
 38 |         x-stainless-runtime:
 39 |           - CPython
 40 |         x-stainless-runtime-version:
 41 |           - 3.12.7
 42 |       method: POST
 43 |       uri: https://api.openai.com/v1/chat/completions
 44 |     response:
 45 |       body:
 46 |         string: !!binary |
 47 |           H4sIAAAAAAAAA4xTTY/aMBC951e4c4YqCbBALlUP1W4rdfupdndLFRl7EgyO7dpOF4T471USSAKl
 48 |           UnOIrHnz3sw8j/cBISA4JATYinpWGDl8/fkLn6x/bXfG3nx9eshvn/zv7M06pxt2/xEGFUMv18j8
 49 |           ifWS6cJI9EKrBmYWqcdKNZqOoiicxdOoBgrNUVa03PjhWA/jMB4Pw9kwvDkSV1owdJCQHwEhhOzr
 50 |           f9Wi4riFhISDU6RA52iOkLRJhIDVsooAdU44T5WHQQcyrTyqqmtVStkDvNYyZVTKrnDz7Xvnzicq
 51 |           ZTpePW/eL5fzcP59++72w6e1uo/y8vFbr14jvTN1Q1mpWOtPD2/jyUUxQkDRouZ6KjcXPEKA2rws
 52 |           UPmqZ9gvTn4sIFnAHUqpX5A7/UwYVeQtafwgO10SrzndvVrAAc4UD8G188+eSxaz0lF5tO8YP7T3
 53 |           IXVurF66C3shE0q4VWqRunrMvtvBqVpdB8qzCwVjdWF86vUGVSU7GTWi0K1bB8bxEfTaU9nFp5PB
 54 |           FbWUo6eivu92xRhlK+Qds1s1WnKhe0DQm/zvZq5pN9MLlf+PfAcwhsYjT41FLtj5wF2axeox/iut
 55 |           9bhuGNzOeSzSTKgcrbGifg+QmTSazPlsNI4Yg+AQ/AEAAP//AwAghIdTGAQAAA==
 56 |       headers:
 57 |         CF-Cache-Status:
 58 |           - DYNAMIC
 59 |         CF-RAY:
 60 |           - 8df95128e8da2386-SJC
 61 |         Connection:
 62 |           - keep-alive
 63 |         Content-Encoding:
 64 |           - gzip
 65 |         Content-Type:
 66 |           - application/json
 67 |         Date:
 68 |           - Fri, 08 Nov 2024 23:24:32 GMT
 69 |         Server:
 70 |           - cloudflare
 71 |         Transfer-Encoding:
 72 |           - chunked
 73 |         X-Content-Type-Options:
 74 |           - nosniff
 75 |         access-control-expose-headers:
 76 |           - X-Request-ID
 77 |         alt-svc:
 78 |           - h3=":443"; ma=86400
 79 |         openai-organization:
 80 |           - future-house-xr4tdh
 81 |         openai-processing-ms:
 82 |           - "423"
 83 |         openai-version:
 84 |           - "2020-10-01"
 85 |         strict-transport-security:
 86 |           - max-age=31536000; includeSubDomains; preload
 87 |         x-ratelimit-limit-requests:
 88 |           - "10000"
 89 |         x-ratelimit-limit-tokens:
 90 |           - "30000000"
 91 |         x-ratelimit-remaining-requests:
 92 |           - "9999"
 93 |         x-ratelimit-remaining-tokens:
 94 |           - "29999980"
 95 |         x-ratelimit-reset-requests:
 96 |           - 6ms
 97 |         x-ratelimit-reset-tokens:
 98 |           - 0s
 99 |         x-request-id:
100 |           - req_173cc061bfeb21f2b6fc27acf7f90100
101 |       status:
102 |         code: 200
103 |         message: OK
104 | version: 1
105 | 


--------------------------------------------------------------------------------
/tests/conftest.py:
--------------------------------------------------------------------------------
  1 | import os
  2 | import random
  3 | from typing import Any
  4 | 
  5 | import numpy as np
  6 | import pytest
  7 | import torch
  8 | from aviary.core import DummyEnv
  9 | from lmi import configure_llm_logs
 10 | 
 11 | from ldp.nn.handlers.transformer_handler import ExecutionMode, ParallelModeConfig
 12 | 
 13 | from . import CASSETTES_DIR
 14 | 
 15 | IN_GITHUB_ACTIONS: bool = os.getenv("GITHUB_ACTIONS") == "true"
 16 | 
 17 | 
 18 | @pytest.fixture(name="dummy_env")
 19 | def fixture_dummy_env() -> DummyEnv:
 20 |     return DummyEnv()
 21 | 
 22 | 
 23 | @pytest.fixture(scope="session", autouse=True)
 24 | def _fixture_set_up_environment() -> None:
 25 |     configure_llm_logs()
 26 | 
 27 | 
 28 | def set_seed(seed: int | None) -> None:
 29 |     if seed is None:
 30 |         return
 31 | 
 32 |     random.seed(seed)
 33 |     np.random.seed(seed)  # noqa: NPY002
 34 |     torch.manual_seed(seed)
 35 |     torch.cuda.manual_seed(seed)
 36 | 
 37 | 
 38 | @pytest.fixture(name="seed_zero")
 39 | def fixture_seed_zero() -> None:
 40 |     """Set a 0 seed to minimize the chances of test flakiness."""
 41 |     set_seed(0)
 42 | 
 43 | 
 44 | OPENAI_API_KEY_HEADER = "authorization"
 45 | ANTHROPIC_API_KEY_HEADER = "x-api-key"
 46 | # SEE: https://github.com/kevin1024/vcrpy/blob/v6.0.1/vcr/config.py#L43
 47 | VCR_DEFAULT_MATCH_ON = "method", "scheme", "host", "port", "path", "query"
 48 | 
 49 | 
 50 | @pytest.fixture(scope="session", name="vcr_config")
 51 | def fixture_vcr_config() -> dict[str, Any]:
 52 |     return {
 53 |         "filter_headers": [OPENAI_API_KEY_HEADER, ANTHROPIC_API_KEY_HEADER, "cookie"],
 54 |         "record_mode": "once",
 55 |         "match_on": ["method", "host", "path", "query"],
 56 |         "allow_playback_repeats": True,
 57 |         "cassette_library_dir": str(CASSETTES_DIR),
 58 |     }
 59 | 
 60 | 
 61 | ENABLED = {"true", "1", "yes"}
 62 | TEST_GPUS: bool = os.getenv("TEST_GPUS", "").lower() in ENABLED
 63 | TEST_SLURM: bool = os.getenv("TEST_SLURM", "").lower() in ENABLED
 64 | 
 65 | PARALLEL_MODE_CONFIGS = [
 66 |     pytest.param(None, id="cpu-only"),
 67 |     pytest.param(
 68 |         ParallelModeConfig(num_workers=2, num_cpus_per_worker=1),
 69 |         id="two-gpu",
 70 |         marks=pytest.mark.skipif(not TEST_GPUS, reason="Requires GPUs"),
 71 |     ),
 72 |     pytest.param(
 73 |         ParallelModeConfig(num_workers=2, num_cpus_per_worker=1, offload_cpu=True),
 74 |         id="two-gpu-offload",
 75 |         marks=pytest.mark.skipif(not TEST_GPUS, reason="Requires GPUs"),
 76 |     ),
 77 |     pytest.param(
 78 |         ParallelModeConfig(
 79 |             num_workers=2,
 80 |             num_cpus_per_worker=1,
 81 |             offload_cpu=True,
 82 |             activation_checkpointing=True,
 83 |             cpu_ram_efficient_loading=True,
 84 |         ),
 85 |         id="two-gpu-all-enabled",
 86 |         marks=pytest.mark.skipif(not TEST_GPUS, reason="Requires GPUs"),
 87 |     ),
 88 |     pytest.param(
 89 |         ParallelModeConfig(
 90 |             num_workers=2,
 91 |             num_cpus_per_worker=1,
 92 |             execution_mode=ExecutionMode.SLURM_CLUSTER,
 93 |         ),
 94 |         id="two-gpus-slurm",
 95 |         marks=pytest.mark.skipif(
 96 |             not TEST_GPUS or not TEST_SLURM, reason="Requires GPUs and SLURM"
 97 |         ),
 98 |     ),
 99 |     pytest.param(
100 |         ParallelModeConfig(
101 |             num_workers=2,
102 |             num_cpus_per_worker=1,
103 |             execution_mode=ExecutionMode.SLURM_CLUSTER,
104 |             offload_cpu=True,
105 |         ),
106 |         id="two-gpus-slurm-offload",
107 |         marks=pytest.mark.skipif(
108 |             not TEST_GPUS or not TEST_SLURM, reason="Requires GPUs and SLURM"
109 |         ),
110 |     ),
111 | ]
112 | 


--------------------------------------------------------------------------------
/tests/test_buffers.py:
--------------------------------------------------------------------------------
 1 | import pytest
 2 | 
 3 | from ldp.alg.optimizer.replay_buffers import (
 4 |     CircularReplayBuffer,
 5 |     PrioritizedReplayBuffer,
 6 | )
 7 | 
 8 | 
 9 | @pytest.mark.asyncio
10 | async def test_circular_buffer() -> None:
11 |     buf = CircularReplayBuffer()
12 | 
13 |     samples = [{"state": 1, "action": 2, "reward": 3, "t": t} for t in range(5)]
14 |     buf += samples
15 |     buf.resize(3)  # should eject t=0, 1
16 |     assert {sample["t"] for sample in buf} == {2, 3, 4}
17 | 
18 |     await buf.prepare_for_sampling()
19 | 
20 |     # check we can iterate
21 |     next(buf.batched_iter(batch_size=3))
22 | 
23 |     # add a bad sample
24 |     buf.append({})
25 |     with pytest.raises(
26 |         RuntimeError, match="Found buffer element with inconsistent keys"
27 |     ):
28 |         next(buf.batched_iter(batch_size=4))
29 | 
30 |     buf.clear()
31 |     assert not buf, "Failed to clear data"
32 | 
33 | 
34 | async def _dummy_q_function(*args, **kwargs) -> float:  # noqa: ARG001, RUF029
35 |     return 1.0
36 | 
37 | 
38 | @pytest.mark.asyncio
39 | async def test_prioritized_buffer():
40 |     buf = PrioritizedReplayBuffer(alpha=1, ranked=False, q_function=_dummy_q_function)
41 | 
42 |     buf += [
43 |         {
44 |             "input_args": (),
45 |             "input_kwargs": {},
46 |             "discounted_return": -1.0 if t % 2 else 1.0,
47 |             "t": t,
48 |         }
49 |         for t in range(6)
50 |     ]
51 |     buf.resize(3)
52 | 
53 |     with pytest.raises(RuntimeError, match="TD errors not available"):
54 |         next(buf.batched_iter(batch_size=3))
55 | 
56 |     await buf.prepare_for_sampling()
57 | 
58 |     # check we can iterate
59 |     batch = next(buf.batched_iter(batch_size=3))
60 | 
61 |     # The odd timesteps should have priority because they have higher error
62 |     assert all(t % 2 for t in batch["t"])
63 | 


--------------------------------------------------------------------------------
/tests/test_loss_ops.py:
--------------------------------------------------------------------------------
 1 | import numpy as np
 2 | import pytest
 3 | import torch
 4 | 
 5 | from ldp.graph import MSELossOp, compute_graph
 6 | 
 7 | 
 8 | @pytest.mark.asyncio
 9 | @pytest.mark.parametrize("input_size", [4, 10])
10 | @pytest.mark.parametrize("dtype", ["numpy", "torch"])
11 | async def test_embedding_op(input_size, dtype) -> None:
12 |     op = MSELossOp()
13 | 
14 |     # Generate data based on dtype
15 |     if dtype == "numpy":
16 |         rng = np.random.default_rng(12345)
17 |         prediction = rng.random(input_size)
18 |         target = rng.random(input_size)
19 |     else:
20 |         prediction = torch.rand(input_size)
21 |         target = torch.rand(input_size)
22 |     async with compute_graph():
23 |         op_result = await op(
24 |             prediction=prediction,
25 |             target=target,
26 |         )
27 | 
28 |     # Validate the output and grads
29 |     op_result.compute_grads()
30 |     grads = op.get_input_grads(op_result.call_id)
31 |     assert grads[0] == []
32 |     assert grads[1].keys() == {"prediction", "target"}
33 |     assert grads[1].get("target") is None
34 |     pred = grads[1].get("prediction")
35 |     if dtype == "numpy":
36 |         assert isinstance(pred, np.ndarray)
37 |         assert isinstance(op_result.value, float)
38 |     else:
39 |         assert isinstance(pred, torch.Tensor)
40 |         assert isinstance(op_result.value, torch.Tensor)
41 |     assert pred.shape == (input_size,)
42 | 


--------------------------------------------------------------------------------
/tests/test_memory.py:
--------------------------------------------------------------------------------
 1 | import pytest
 2 | from lmi import EmbeddingModel
 3 | from pytest_subtests import SubTests
 4 | 
 5 | from ldp.graph import Memory
 6 | from ldp.graph.memory import UIndexMemoryModel
 7 | 
 8 | 
 9 | @pytest.fixture(name="sample_memory")
10 | def fixture_sample_memory() -> Memory:
11 |     return Memory(
12 |         query="sample string representation", output="observation", value=42.0
13 |     )
14 | 
15 | 
16 | class TestUIndexMemoryModel:
17 |     def test_initialization_serialization(self, subtests: SubTests) -> None:
18 |         with subtests.test(msg="default-model-specified"):
19 |             model = UIndexMemoryModel()
20 |             assert isinstance(model.embedding_model, EmbeddingModel), (
21 |                 "Default embedding model should be set"
22 |             )
23 |             model.model_dump()  # Check we can serialize
24 | 
25 |         with subtests.test(msg="nondefault-model-specified"):
26 |             model_custom = UIndexMemoryModel(
27 |                 embedding_model=EmbeddingModel.from_name("text-embedding-3-small")
28 |             )
29 |             model_custom.model_dump()  # Check we can serialize
30 | 
31 |     @pytest.mark.asyncio
32 |     async def test_add_then_get_memory(self, sample_memory: Memory) -> None:
33 |         memory_model = UIndexMemoryModel(
34 |             embedding_model=EmbeddingModel.from_name("text-embedding-3-small")
35 |         )
36 |         async with memory_model.safe_access_index() as index:
37 |             assert len(index) == 0, "Should have no memories"
38 |         await memory_model.add_memory(sample_memory)
39 |         async with memory_model.safe_access_index() as index:
40 |             assert len(index) == 1, "Should have one memory"
41 |         assert memory_model.memories[0] == sample_memory
42 |         result = await memory_model.get_memory("sample query", matches=1)
43 |         assert len(result) == 1
44 |         assert result[0] == sample_memory
45 | 


--------------------------------------------------------------------------------
/tests/test_nn_ops.py:
--------------------------------------------------------------------------------
 1 | import asyncio
 2 | 
 3 | import pytest
 4 | from aviary.core import Message
 5 | 
 6 | import ldp.nn
 7 | from ldp.graph import OpResult
 8 | 
 9 | 
10 | class TestLocalLLMCallOp:
11 |     @pytest.mark.asyncio
12 |     async def test_batching_consistent_results(self):
13 |         """Tests that padding in batched calls does not affect the results (attention_mask is set correctly)."""
14 |         model_config = ldp.nn.LMConfig(
15 |             model="gpt2", device="cpu", dtype=ldp.nn.TorchDType.fp32
16 |         )
17 |         local_llm_call_op = ldp.nn.LocalLLMCallOp(
18 |             model_config, batch_size=2, max_wait_interval=1.0
19 |         )
20 | 
21 |         messages = [
22 |             Message(content=text)
23 |             for text in ("Hello, how are you?", "Hello, how are you?")
24 |         ]
25 | 
26 |         async def forward_batch() -> list[OpResult[Message]]:
27 |             return await asyncio.gather(*[
28 |                 local_llm_call_op([msg], temperature=1.0, max_new_tokens=10)
29 |                 for msg in messages
30 |             ])
31 | 
32 |         # First forward batch with seed set to 0
33 |         ldp.nn.set_seed(0)
34 |         results_first_call = await forward_batch()
35 | 
36 |         # Re-seed and forward batch again with padding to check for consistency
37 |         ldp.nn.set_seed(0)
38 |         messages[
39 |             -1
40 |         ].content = (
41 |             "Some very long text that would create lots of padding in the batch."
42 |         )
43 |         results_second_call = await forward_batch()
44 | 
45 |         assert len(results_first_call) == len(results_second_call), (
46 |             "Expected the number of results to match between the two calls."
47 |         )
48 |         assert results_first_call[0].value == results_second_call[0].value, (
49 |             "Expected the results to match between the two calls, but got differing"
50 |             " results."
51 |         )
52 | 


--------------------------------------------------------------------------------
/tests/test_prompts.py:
--------------------------------------------------------------------------------
 1 | import textwrap
 2 | 
 3 | from ldp.llms.prompts import indent_xml
 4 | 
 5 | 
 6 | def test_indent_xml():
 7 |     xml = "<root><child1>foo<child2>line1\nline2\nline3</child2></child1></root>"
 8 |     expected = textwrap.dedent(
 9 |         """\
10 |         <root>
11 |           <child1>
12 |             foo
13 |             <child2>
14 |               line1
15 |               line2
16 |               line3
17 |             </child2>
18 |           </child1>
19 |         </root>"""
20 |     )
21 |     assert indent_xml(xml) == expected
22 | 


--------------------------------------------------------------------------------
/tests/test_shims.py:
--------------------------------------------------------------------------------
 1 | import importlib
 2 | import os
 3 | from unittest.mock import patch
 4 | 
 5 | import ldp.shims
 6 | 
 7 | 
 8 | def test_tqdm_import() -> None:
 9 |     assert ldp.shims.tqdm.__module__ == "tqdm.std"
10 |     with patch.dict(os.environ, {"LDP_TQDM_USE_RICH": "1"}):
11 |         importlib.reload(ldp.shims)
12 |         assert ldp.shims.tqdm.__module__ == "tqdm.rich"
13 | 


--------------------------------------------------------------------------------
/tests/test_utils.py:
--------------------------------------------------------------------------------
 1 | from dataclasses import dataclass
 2 | from typing import Any
 3 | 
 4 | from ldp.utils import format_error_details
 5 | 
 6 | 
 7 | @dataclass
 8 | class MockResponse:
 9 |     status_code: int
10 |     _json: dict | None = None
11 |     _text: str = ""
12 | 
13 |     def json(self) -> dict[str, Any]:
14 |         if self._json is None:
15 |             raise ValueError("No JSON")
16 |         return self._json
17 | 
18 |     @property
19 |     def text(self) -> str:
20 |         return self._text
21 | 
22 | 
23 | class MockHTTPError(Exception):
24 |     def __init__(self, status_code: int, detail: str | None = None, text: str = ""):
25 |         self.response = MockResponse(
26 |             status_code=status_code,
27 |             _json={"detail": detail} if detail else None,
28 |             _text=text,
29 |         )
30 |         super().__init__(f"HTTP {status_code}")
31 | 
32 | 
33 | def test_format_basic_error():
34 |     error = ValueError("something went wrong")
35 |     details = format_error_details(error)
36 |     assert details == "something went wrong"
37 | 
38 | 
39 | def test_format_http_error_with_json():
40 |     error = MockHTTPError(
41 |         status_code=500,
42 |         detail="Traceback:\n  File 'app.py', line 123\n  raise ValueError('oops')",
43 |     )
44 |     details = format_error_details(error)
45 |     assert "Status code: 500" in details
46 |     assert "Server Traceback:" in details
47 |     assert "File 'app.py'" in details
48 | 
49 | 
50 | def test_format_http_error_with_text():
51 |     error = MockHTTPError(status_code=404, text="Not found")
52 |     details = format_error_details(error)
53 |     assert "Status code: 404" in details
54 |     assert "Response body: Not found" in details
55 | 


--------------------------------------------------------------------------------
/tutorials/evaluating_a_llama_agent.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# Llama Agent Inference (GPU)\n",
  8 |     "\n",
  9 |     "A notebook demonstrating how to use an agent powered by a local model (Llama 3.1 8B) to solve problems in the GSM8k test set using a calculator. **The tutorial assumes access to a GPU machine**.\n",
 10 |     "\n",
 11 |     "Note that the model struggles to output valid tool call syntax consistently, causing many failures.\n",
 12 |     "\n",
 13 |     "TODO: add EI notebook demonstrating how to address this\n",
 14 |     "\n",
 15 |     "NB: To run this notebook you need to install ldp with the `nn` dependency as well as the aviary dependencies\n",
 16 |     "\n",
 17 |     "```bash\n",
 18 |     "pip install \"ldp[nn]\" \"fhaviary[gsm8k]\"\n",
 19 |     "```"
 20 |    ]
 21 |   },
 22 |   {
 23 |    "cell_type": "code",
 24 |    "execution_count": null,
 25 |    "metadata": {},
 26 |    "outputs": [],
 27 |    "source": [
 28 |     "from aviary.envs.gsm8k import GSM8kDataset\n",
 29 |     "\n",
 30 |     "from ldp.alg import Evaluator, EvaluatorConfig\n",
 31 |     "from ldp.alg.callbacks import Callback\n",
 32 |     "from ldp.data_structures import Trajectory\n",
 33 |     "from ldp.nn import AgentLMConfig, SimpleLocalLLMAgent, TorchDType"
 34 |    ]
 35 |   },
 36 |   {
 37 |    "cell_type": "code",
 38 |    "execution_count": null,
 39 |    "metadata": {},
 40 |    "outputs": [],
 41 |    "source": [
 42 |     "class AccuracyCallback(Callback):\n",
 43 |     "    \"\"\"Simple callback that logs accuracy of each batch.\"\"\"\n",
 44 |     "\n",
 45 |     "    async def after_eval_step(self, trajectories: list[Trajectory]):\n",
 46 |     "        # CalculatorEnvironment returns a terminal reward of 1 if\n",
 47 |     "        # the agent solved the problem correctly.\n",
 48 |     "        pass_rate = sum(t.steps[-1].reward == 1 for t in trajectories) / len(\n",
 49 |     "            trajectories\n",
 50 |     "        )\n",
 51 |     "        print(f\"Pass rate: {100 * pass_rate:.2f}%\")"
 52 |    ]
 53 |   },
 54 |   {
 55 |    "cell_type": "code",
 56 |    "execution_count": null,
 57 |    "metadata": {},
 58 |    "outputs": [],
 59 |    "source": [
 60 |     "lm_config = AgentLMConfig(\n",
 61 |     "    model=\"meta-llama/Llama-3.1-8B-Instruct\",\n",
 62 |     "    dtype=TorchDType.bf16,\n",
 63 |     "    chat_template=\"llama3.1_chat_template_thought.jinja\",\n",
 64 |     "    max_new_tokens=100,\n",
 65 |     "    # Parameters for async inference\n",
 66 |     "    batch_size=8,  # fits onto a single 4090 with these params\n",
 67 |     "    max_wait_interval=10.0,\n",
 68 |     ")\n",
 69 |     "agent = SimpleLocalLLMAgent(lm_config)"
 70 |    ]
 71 |   },
 72 |   {
 73 |    "cell_type": "code",
 74 |    "execution_count": null,
 75 |    "metadata": {},
 76 |    "outputs": [],
 77 |    "source": [
 78 |     "dataset = GSM8kDataset(split=\"test\")\n",
 79 |     "callback = AccuracyCallback()\n",
 80 |     "evaluator = Evaluator(\n",
 81 |     "    config=EvaluatorConfig(\n",
 82 |     "        batch_size=64,\n",
 83 |     "        num_eval_iterations=1,  # Only run one batch, then exit\n",
 84 |     "        max_rollout_steps=10,\n",
 85 |     "    ),\n",
 86 |     "    agent=agent,\n",
 87 |     "    dataset=dataset,\n",
 88 |     "    callbacks=[callback],\n",
 89 |     ")\n",
 90 |     "\n",
 91 |     "# Note that Llama 3.1 8B does not always reliably follow the tool-calling\n",
 92 |     "# syntax, so we will see several (caught) errors. The pass rate will be <10%.\n",
 93 |     "await evaluator.evaluate()"
 94 |    ]
 95 |   }
 96 |  ],
 97 |  "metadata": {
 98 |   "kernelspec": {
 99 |    "display_name": "Python 3 (ipykernel)",
100 |    "language": "python",
101 |    "name": "python3"
102 |   },
103 |   "language_info": {
104 |    "codemirror_mode": {
105 |     "name": "ipython",
106 |     "version": 3
107 |    },
108 |    "file_extension": ".py",
109 |    "mimetype": "text/x-python",
110 |    "name": "python",
111 |    "nbconvert_exporter": "python",
112 |    "pygments_lexer": "ipython3"
113 |   }
114 |  },
115 |  "nbformat": 4,
116 |  "nbformat_minor": 4
117 | }
118 | 


--------------------------------------------------------------------------------