├── .github
    └── workflows
    │   └── publish.yml
├── LICENSE
├── README.md
├── extension
    ├── .gitignore
    ├── README.md
    ├── components.json
    ├── package-lock.json
    ├── package.json
    ├── src
    │   ├── assets
    │   │   ├── react.svg
    │   │   └── tailwind.css
    │   ├── components
    │   │   └── ui
    │   │   │   └── button.tsx
    │   ├── entrypoints
    │   │   ├── background.ts
    │   │   ├── content.ts
    │   │   └── sidepanel
    │   │   │   ├── components
    │   │   │       ├── error-view.tsx
    │   │   │       ├── event-viewer.tsx
    │   │   │       ├── initial-view.tsx
    │   │   │       ├── logina-view.tsx
    │   │   │       ├── recording-view.tsx
    │   │   │       └── stopped-view.tsx
    │   │   │   ├── context
    │   │   │       └── workflow-provider.tsx
    │   │   │   ├── index.html
    │   │   │   └── index.tsx
    │   ├── lib
    │   │   ├── message-bus-types.ts
    │   │   ├── types.ts
    │   │   ├── utils.ts
    │   │   └── workflow-types.ts
    │   └── public
    │   │   ├── icon
    │   │       ├── 128.png
    │   │       ├── 16.png
    │   │       ├── 32.png
    │   │       └── 48.png
    │   │   └── wxt.svg
    ├── tsconfig.json
    ├── vite.config.ts
    └── wxt.config.ts
├── static
    └── workflow-use.png
├── ui
    ├── .eslintrc.cjs
    ├── .github
    │   └── dependabot.yml
    ├── .gitignore
    ├── index.html
    ├── package-lock.json
    ├── package.json
    ├── public
    │   ├── browseruse.png
    │   └── favicon.ico
    ├── src
    │   ├── App.tsx
    │   ├── components
    │   │   ├── log-viewer.tsx
    │   │   ├── no-workflow-message.tsx
    │   │   ├── node-config-menu.tsx
    │   │   ├── play-button.tsx
    │   │   ├── sidebar.tsx
    │   │   ├── workflow-item.tsx
    │   │   └── workflow-layout.tsx
    │   ├── index.css
    │   ├── lib
    │   │   └── api
    │   │   │   ├── index.ts
    │   │   │   └── openapi.json
    │   ├── main.tsx
    │   ├── types
    │   │   ├── log-viewer.types.ts
    │   │   ├── node-config-menu.types.ts
    │   │   ├── play-button.types.ts
    │   │   ├── sidebar.types.ts
    │   │   └── workflow-layout.types.ts
    │   ├── utils
    │   │   └── json-to-flow.ts
    │   └── vite-env.d.ts
    ├── tsconfig.json
    ├── tsconfig.node.json
    └── vite.config.ts
└── workflows
    ├── .env.example
    ├── .gitignore
    ├── .python-version
    ├── .vscode
        ├── launch.json
        └── settings.json
    ├── README.md
    ├── backend
        ├── api.py
        ├── routers.py
        ├── service.py
        └── views.py
    ├── cli.py
    ├── examples
        ├── example.workflow.json
        └── runner.py
    ├── pyproject.toml
    ├── uv.lock
    └── workflow_use
        ├── __init__.py
        ├── builder
            ├── prompts.py
            ├── service.py
            └── tests
            │   └── build_workflow.py
        ├── controller
            ├── service.py
            ├── utils.py
            └── views.py
        ├── mcp
            ├── service.py
            └── tests
            │   └── test_tools.py
        ├── recorder
            ├── recorder.py
            ├── service.py
            └── views.py
        ├── schema
            └── views.py
        └── workflow
            ├── prompts.py
            ├── service.py
            ├── tests
                ├── run_workflow.py
                └── test_extract.py
            └── views.py


/.github/workflows/publish.yml:
--------------------------------------------------------------------------------
 1 | # This workflow will upload a Python Package using Twine when a release is created
 2 | # For more information see: https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-python#publishing-to-package-registries
 3 | 
 4 | # This workflow uses actions that are not certified by GitHub.
 5 | # They are provided by a third-party and are governed by
 6 | # separate terms of service, privacy policy, and support
 7 | # documentation.
 8 | 
 9 | name: publish
10 | 
11 | on:
12 |   release:
13 |     types: [published] # publish full release to PyPI when a release is created on Github
14 |   schedule:
15 |     - cron: "0 17 * * FRI" # tag a pre-release on Github every Friday at 5 PM UTC
16 | 
17 | permissions:
18 |   contents: write
19 |   id-token: write
20 | 
21 | jobs:
22 |   tag_pre_release:
23 |     if: github.event_name == 'schedule'
24 |     runs-on: ubuntu-latest
25 |     defaults:
26 |       run:
27 |         working-directory: workflows
28 |     steps:
29 |       - uses: actions/checkout@v4
30 |       - name: Create pre-release tag
31 |         run: |
32 |           git fetch --tags
33 |           latest_tag=$(git tag --list --sort=-v:refname | grep -E '^v[0-9]+\.[0-9]+\.[0-9]+rc[0-9]+$' | head -n 1)
34 |           if [ -z "$latest_tag" ]; then
35 |             new_tag="v0.1.0rc1"
36 |           else
37 |             new_tag=$(echo $latest_tag | awk -F'rc' '{print $1 "rc" $2+1}')
38 |           fi
39 |           git tag $new_tag
40 |           git push origin $new_tag
41 | 
42 |   publish_to_pypi:
43 |     if: github.event_name == 'release'
44 |     runs-on: ubuntu-latest
45 |     defaults:
46 |       run:
47 |         working-directory: workflows
48 |     steps:
49 |       - uses: actions/checkout@v4
50 |       - name: Set up Python
51 |         uses: actions/setup-python@v5
52 |         with:
53 |           python-version: "3.x"
54 |       - uses: astral-sh/setup-uv@v5
55 |       - run: uv run ruff check --no-fix --select PLE # check only for syntax errors
56 |       - run: uv build
57 |       - run: uv publish --trusted-publishing always
58 |       - name: Push to stable branch (if stable release)
59 |         if: startsWith(github.ref_name, 'v') && !contains(github.ref_name, 'rc')
60 |         run: |
61 |           git checkout -b stable
62 |           git push origin stable
63 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
  1 | <picture>
  2 |   <img alt="Workflow Use logo - a product by Browser Use." src="./static/workflow-use.png"  width="full">
  3 | </picture>
  4 | 
  5 | <br />
  6 | 
  7 | <h1 align="center">Deterministic, Self Healing Workflows (RPA 2.0)</h1>
  8 | 
  9 | [![GitHub stars](https://img.shields.io/github/stars/browser-use/workflow-use?style=social)](https://github.com/browser-use/workflow-use/stargazers)
 10 | [![Discord](https://img.shields.io/discord/1303749220842340412?color=7289DA&label=Discord&logo=discord&logoColor=white)](https://link.browser-use.com/discord)
 11 | [![Cloud](https://img.shields.io/badge/Cloud-☁️-blue)](https://cloud.browser-use.com)
 12 | [![Twitter Follow](https://img.shields.io/twitter/follow/Gregor?style=social)](https://x.com/gregpr07)
 13 | [![Twitter Follow](https://img.shields.io/twitter/follow/Magnus?style=social)](https://x.com/mamagnus00)
 14 | 
 15 | ⚙️ **Workflow Use** is the easiest way to create and execute deterministic workflows with variables which fallback to [Browser Use](https://github.com/browser-use/browser-use) if a step fails. You just _show_ the recorder the workflow, we automatically generate the workflow.
 16 | 
 17 | ❗ This project is in very early development so we don't recommend using this in production. Lots of things will change and we don't have a release schedule yet. Originally, the project was born out of customer demand to make Browser Use more reliable and deterministic.
 18 | 
 19 | # Quick start
 20 | 
 21 | ```bash
 22 | git clone https://github.com/browser-use/workflow-use
 23 | ```
 24 | 
 25 | ## Build the extension
 26 | 
 27 | ```bash
 28 | cd extension && npm install && npm run build
 29 | ```
 30 | 
 31 | ## Setup workflow environment
 32 | 
 33 | ```bash
 34 | cd .. && cd workflows
 35 | uv sync
 36 | source .venv/bin/activate # for mac / linux
 37 | playwright install chromium
 38 | cp .env.example .env # add your OPENAI_API_KEY to the .env file
 39 | ```
 40 | 
 41 | 
 42 | ## Run workflow as tool
 43 | 
 44 | ```bash
 45 | python cli.py run-as-tool examples/example.workflow.json --prompt "fill the form with example data"
 46 | ```
 47 | 
 48 | ## Run workflow with predefined variables
 49 | 
 50 | ```bash
 51 | python cli.py run-workflow examples/example.workflow.json 
 52 | ```
 53 | 
 54 | ## Record your own workflow
 55 | 
 56 | ```bash
 57 | python cli.py create-workflow
 58 | ```
 59 | 
 60 | ## See all commands
 61 | 
 62 | ```bash
 63 | python cli.py --help
 64 | ```
 65 | 
 66 | # Usage from python
 67 | 
 68 | Running the workflow files is as simple as:
 69 | 
 70 | ```python
 71 | from workflow_use import Workflow
 72 | 
 73 | workflow = Workflow.load_from_file("example.workflow.json")
 74 | result = asyncio.run(workflow.run_as_tool("I want to search for 'workflow use'"))
 75 | ```
 76 | 
 77 | ## Launch the GUI
 78 | 
 79 | The Workflow UI provides a visual interface for managing, viewing, and executing workflows.
 80 | 
 81 | ### Option 1: Using the CLI command (Recommended)
 82 | 
 83 | The easiest way to start the GUI is with the built-in CLI command:
 84 | 
 85 | ```bash
 86 | cd workflows
 87 | python cli.py launch-gui
 88 | ```
 89 | 
 90 | This command will:
 91 | - Start the backend server (FastAPI)
 92 | - Start the frontend development server
 93 | - Automatically open http://localhost:5173 in your browser
 94 | - Capture logs to the `./tmp/logs` directory
 95 | 
 96 | Press Ctrl+C to stop both servers when you're done.
 97 | 
 98 | ### Option 2: Start servers separately
 99 | 
100 | Alternatively, you can start the servers individually:
101 | 
102 | #### Start the backend server
103 | 
104 | ```bash
105 | cd workflows
106 | uvicorn backend.api:app --reload
107 | ```
108 | 
109 | #### Start the frontend development server
110 | 
111 | ```bash
112 | cd ui
113 | npm install
114 | npm run dev
115 | ```
116 | 
117 | Once both servers are running, you can access the Workflow GUI at http://localhost:5173 in your browser. The UI allows you to:
118 | 
119 | - Visualize workflows as interactive graphs
120 | - Execute workflows with custom input parameters
121 | - Monitor workflow execution logs in real-time
122 | - Edit workflow metadata and details
123 | 
124 | # Demos
125 | 
126 | ## Workflow Use filling out form instantly
127 | 
128 | https://github.com/user-attachments/assets/cf284e08-8c8c-484a-820a-02c507de11d4
129 | 
130 | ## Gregor's explanation
131 | 
132 | https://github.com/user-attachments/assets/379e57c7-f03e-4eb9-8184-521377d5c0f9
133 | 
134 | # Features
135 | 
136 | - 🔁 **Record Once, Reuse Forever**: Record browser interactions once and replay them indefinitely.
137 | - ⏳ **Show, don't prompt**: No need to spend hours prompting Browser Use to do the same thing over and over again.
138 | - ⚙️ **Structured & Executable Workflows**: Converts recordings into deterministic, fast, and reliable workflows which automatically extract variables from forms.
139 | - 🪄 **Human-like Interaction Understanding**: Intelligently filters noise from recordings to create meaningful workflows.
140 | - 🔒 **Enterprise-Ready Foundation**: Built for future scalability with features like self-healing and workflow diffs.
141 | 
142 | # Vision and roadmap
143 | 
144 | Show computer what it needs to do once, and it will do it over and over again without any human intervention.
145 | 
146 | ## Workflows
147 | 
148 | - [ ] Nice way to use the `.json` files inside python code
149 | - [ ] Improve LLM fallback when step fails (currently really bad)
150 | - [ ] Self healing, if it fails automatically agent kicks in and updates the workflow file
151 | - [ ] Better support for LLM steps
152 | - [ ] Take output from previous steps and use it as input for next steps
153 | - [ ] Expose workflows as MCP tools
154 | - [ ] Use Browser Use to automatically create workflows from websites
155 | 
156 | ## Developer experience
157 | 
158 | - [ ] Improve CLI
159 | - [ ] Improve extension
160 | - [ ] Step editor
161 | 
162 | ## Agent
163 | 
164 | - [ ] Allow Browser Use to use the workflows as MCP tools
165 | - [ ] Use workflows as website caching layer
166 | 


--------------------------------------------------------------------------------
/extension/.gitignore:
--------------------------------------------------------------------------------
 1 | # Logs
 2 | logs
 3 | *.log
 4 | npm-debug.log*
 5 | yarn-debug.log*
 6 | yarn-error.log*
 7 | pnpm-debug.log*
 8 | lerna-debug.log*
 9 | 
10 | node_modules
11 | .output
12 | stats.html
13 | stats-*.json
14 | .wxt
15 | web-ext.config.ts
16 | 
17 | # Editor directories and files
18 | .vscode/*
19 | !.vscode/extensions.json
20 | .idea
21 | .DS_Store
22 | *.suo
23 | *.ntvs*
24 | *.njsproj
25 | *.sln
26 | *.sw?
27 | 


--------------------------------------------------------------------------------
/extension/README.md:
--------------------------------------------------------------------------------
1 | # WXT + React
2 | 
3 | This template should help get you started developing with React in WXT.
4 | 


--------------------------------------------------------------------------------
/extension/components.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "$schema": "https://ui.shadcn.com/schema.json",
 3 |   "style": "new-york",
 4 |   "rsc": false,
 5 |   "tsx": true,
 6 |   "tailwind": {
 7 |     "config": "",
 8 |     "css": "assets/tailwind.css",
 9 |     "baseColor": "neutral",
10 |     "cssVariables": true,
11 |     "prefix": ""
12 |   },
13 |   "aliases": {
14 |     "components": "@/components",
15 |     "utils": "@/lib/utils",
16 |     "ui": "@/components/ui",
17 |     "lib": "@/lib",
18 |     "hooks": "@/hooks"
19 |   },
20 |   "iconLibrary": "lucide"
21 | }


--------------------------------------------------------------------------------
/extension/package.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "name": "browser-use-workflow-recorder",
 3 |   "description": "record and enchance workflows for browser use",
 4 |   "private": true,
 5 |   "version": "0.0.0",
 6 |   "type": "module",
 7 |   "scripts": {
 8 |     "dev": "wxt",
 9 |     "dev:firefox": "wxt -b firefox",
10 |     "build": "wxt build",
11 |     "build:firefox": "wxt build -b firefox",
12 |     "zip": "wxt zip",
13 |     "zip:firefox": "wxt zip -b firefox",
14 |     "compile": "tsc --noEmit",
15 |     "postinstall": "wxt prepare"
16 |   },
17 |   "dependencies": {
18 |     "@radix-ui/react-slot": "^1.2.0",
19 |     "@tailwindcss/vite": "^4.1.5",
20 |     "class-variance-authority": "^0.7.1",
21 |     "clsx": "^2.1.1",
22 |     "lucide-react": "^0.507.0",
23 |     "react": "^19.1.0",
24 |     "react-dom": "^19.1.0",
25 |     "rrweb": "^2.0.0-alpha.4",
26 |     "tailwind-merge": "^3.2.0",
27 |     "tailwindcss": "^4.1.5"
28 |   },
29 |   "devDependencies": {
30 |     "@types/chrome": "^0.0.318",
31 |     "@types/node": "^22.15.3",
32 |     "@types/react": "^19.1.2",
33 |     "@types/react-dom": "^19.1.3",
34 |     "@wxt-dev/module-react": "^1.1.3",
35 |     "tw-animate-css": "^1.2.9",
36 |     "typescript": "^5.8.3",
37 |     "wxt": "^0.20.6"
38 |   }
39 | }
40 | 


--------------------------------------------------------------------------------
/extension/src/assets/react.svg:
--------------------------------------------------------------------------------
1 | <svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" class="iconify iconify--logos" width="35.93" height="32" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 228"><path fill="#00D8FF" d="M210.483 73.824a171.49 171.49 0 0 0-8.24-2.597c.465-1.9.893-3.777 1.273-5.621c6.238-30.281 2.16-54.676-11.769-62.708c-13.355-7.7-35.196.329-57.254 19.526a171.23 171.23 0 0 0-6.375 5.848a155.866 155.866 0 0 0-4.241-3.917C100.759 3.829 77.587-4.822 63.673 3.233C50.33 10.957 46.379 33.89 51.995 62.588a170.974 170.974 0 0 0 1.892 8.48c-3.28.932-6.445 1.924-9.474 2.98C17.309 83.498 0 98.307 0 113.668c0 15.865 18.582 31.778 46.812 41.427a145.52 145.52 0 0 0 6.921 2.165a167.467 167.467 0 0 0-2.01 9.138c-5.354 28.2-1.173 50.591 12.134 58.266c13.744 7.926 36.812-.22 59.273-19.855a145.567 145.567 0 0 0 5.342-4.923a168.064 168.064 0 0 0 6.92 6.314c21.758 18.722 43.246 26.282 56.54 18.586c13.731-7.949 18.194-32.003 12.4-61.268a145.016 145.016 0 0 0-1.535-6.842c1.62-.48 3.21-.974 4.76-1.488c29.348-9.723 48.443-25.443 48.443-41.52c0-15.417-17.868-30.326-45.517-39.844Zm-6.365 70.984c-1.4.463-2.836.91-4.3 1.345c-3.24-10.257-7.612-21.163-12.963-32.432c5.106-11 9.31-21.767 12.459-31.957c2.619.758 5.16 1.557 7.61 2.4c23.69 8.156 38.14 20.213 38.14 29.504c0 9.896-15.606 22.743-40.946 31.14Zm-10.514 20.834c2.562 12.94 2.927 24.64 1.23 33.787c-1.524 8.219-4.59 13.698-8.382 15.893c-8.067 4.67-25.32-1.4-43.927-17.412a156.726 156.726 0 0 1-6.437-5.87c7.214-7.889 14.423-17.06 21.459-27.246c12.376-1.098 24.068-2.894 34.671-5.345a134.17 134.17 0 0 1 1.386 6.193ZM87.276 214.515c-7.882 2.783-14.16 2.863-17.955.675c-8.075-4.657-11.432-22.636-6.853-46.752a156.923 156.923 0 0 1 1.869-8.499c10.486 2.32 22.093 3.988 34.498 4.994c7.084 9.967 14.501 19.128 21.976 27.15a134.668 134.668 0 0 1-4.877 4.492c-9.933 8.682-19.886 14.842-28.658 17.94ZM50.35 144.747c-12.483-4.267-22.792-9.812-29.858-15.863c-6.35-5.437-9.555-10.836-9.555-15.216c0-9.322 13.897-21.212 37.076-29.293c2.813-.98 5.757-1.905 8.812-2.773c3.204 10.42 7.406 21.315 12.477 32.332c-5.137 11.18-9.399 22.249-12.634 32.792a134.718 134.718 0 0 1-6.318-1.979Zm12.378-84.26c-4.811-24.587-1.616-43.134 6.425-47.789c8.564-4.958 27.502 2.111 47.463 19.835a144.318 144.318 0 0 1 3.841 3.545c-7.438 7.987-14.787 17.08-21.808 26.988c-12.04 1.116-23.565 2.908-34.161 5.309a160.342 160.342 0 0 1-1.76-7.887Zm110.427 27.268a347.8 347.8 0 0 0-7.785-12.803c8.168 1.033 15.994 2.404 23.343 4.08c-2.206 7.072-4.956 14.465-8.193 22.045a381.151 381.151 0 0 0-7.365-13.322Zm-45.032-43.861c5.044 5.465 10.096 11.566 15.065 18.186a322.04 322.04 0 0 0-30.257-.006c4.974-6.559 10.069-12.652 15.192-18.18ZM82.802 87.83a323.167 323.167 0 0 0-7.227 13.238c-3.184-7.553-5.909-14.98-8.134-22.152c7.304-1.634 15.093-2.97 23.209-3.984a321.524 321.524 0 0 0-7.848 12.897Zm8.081 65.352c-8.385-.936-16.291-2.203-23.593-3.793c2.26-7.3 5.045-14.885 8.298-22.6a321.187 321.187 0 0 0 7.257 13.246c2.594 4.48 5.28 8.868 8.038 13.147Zm37.542 31.03c-5.184-5.592-10.354-11.779-15.403-18.433c4.902.192 9.899.29 14.978.29c5.218 0 10.376-.117 15.453-.343c-4.985 6.774-10.018 12.97-15.028 18.486Zm52.198-57.817c3.422 7.8 6.306 15.345 8.596 22.52c-7.422 1.694-15.436 3.058-23.88 4.071a382.417 382.417 0 0 0 7.859-13.026a347.403 347.403 0 0 0 7.425-13.565Zm-16.898 8.101a358.557 358.557 0 0 1-12.281 19.815a329.4 329.4 0 0 1-23.444.823c-7.967 0-15.716-.248-23.178-.732a310.202 310.202 0 0 1-12.513-19.846h.001a307.41 307.41 0 0 1-10.923-20.627a310.278 310.278 0 0 1 10.89-20.637l-.001.001a307.318 307.318 0 0 1 12.413-19.761c7.613-.576 15.42-.876 23.31-.876H128c7.926 0 15.743.303 23.354.883a329.357 329.357 0 0 1 12.335 19.695a358.489 358.489 0 0 1 11.036 20.54a329.472 329.472 0 0 1-11 20.722Zm22.56-122.124c8.572 4.944 11.906 24.881 6.52 51.026c-.344 1.668-.73 3.367-1.15 5.09c-10.622-2.452-22.155-4.275-34.23-5.408c-7.034-10.017-14.323-19.124-21.64-27.008a160.789 160.789 0 0 1 5.888-5.4c18.9-16.447 36.564-22.941 44.612-18.3ZM128 90.808c12.625 0 22.86 10.235 22.86 22.86s-10.235 22.86-22.86 22.86s-22.86-10.235-22.86-22.86s10.235-22.86 22.86-22.86Z"></path></svg>
2 | 


--------------------------------------------------------------------------------
/extension/src/assets/tailwind.css:
--------------------------------------------------------------------------------
  1 | @import "tailwindcss";
  2 | @import "tw-animate-css";
  3 | 
  4 | @custom-variant dark (&:is(.dark *));
  5 | 
  6 | @theme inline {
  7 |   --radius-sm: calc(var(--radius) - 4px);
  8 |   --radius-md: calc(var(--radius) - 2px);
  9 |   --radius-lg: var(--radius);
 10 |   --radius-xl: calc(var(--radius) + 4px);
 11 |   --color-background: var(--background);
 12 |   --color-foreground: var(--foreground);
 13 |   --color-card: var(--card);
 14 |   --color-card-foreground: var(--card-foreground);
 15 |   --color-popover: var(--popover);
 16 |   --color-popover-foreground: var(--popover-foreground);
 17 |   --color-primary: var(--primary);
 18 |   --color-primary-foreground: var(--primary-foreground);
 19 |   --color-secondary: var(--secondary);
 20 |   --color-secondary-foreground: var(--secondary-foreground);
 21 |   --color-muted: var(--muted);
 22 |   --color-muted-foreground: var(--muted-foreground);
 23 |   --color-accent: var(--accent);
 24 |   --color-accent-foreground: var(--accent-foreground);
 25 |   --color-destructive: var(--destructive);
 26 |   --color-border: var(--border);
 27 |   --color-input: var(--input);
 28 |   --color-ring: var(--ring);
 29 |   --color-chart-1: var(--chart-1);
 30 |   --color-chart-2: var(--chart-2);
 31 |   --color-chart-3: var(--chart-3);
 32 |   --color-chart-4: var(--chart-4);
 33 |   --color-chart-5: var(--chart-5);
 34 |   --color-sidebar: var(--sidebar);
 35 |   --color-sidebar-foreground: var(--sidebar-foreground);
 36 |   --color-sidebar-primary: var(--sidebar-primary);
 37 |   --color-sidebar-primary-foreground: var(--sidebar-primary-foreground);
 38 |   --color-sidebar-accent: var(--sidebar-accent);
 39 |   --color-sidebar-accent-foreground: var(--sidebar-accent-foreground);
 40 |   --color-sidebar-border: var(--sidebar-border);
 41 |   --color-sidebar-ring: var(--sidebar-ring);
 42 | }
 43 | 
 44 | :root {
 45 |   --radius: 0.625rem;
 46 |   --background: oklch(1 0 0);
 47 |   --foreground: oklch(0.145 0 0);
 48 |   --card: oklch(1 0 0);
 49 |   --card-foreground: oklch(0.145 0 0);
 50 |   --popover: oklch(1 0 0);
 51 |   --popover-foreground: oklch(0.145 0 0);
 52 |   --primary: oklch(0.205 0 0);
 53 |   --primary-foreground: oklch(0.985 0 0);
 54 |   --secondary: oklch(0.97 0 0);
 55 |   --secondary-foreground: oklch(0.205 0 0);
 56 |   --muted: oklch(0.97 0 0);
 57 |   --muted-foreground: oklch(0.556 0 0);
 58 |   --accent: oklch(0.97 0 0);
 59 |   --accent-foreground: oklch(0.205 0 0);
 60 |   --destructive: oklch(0.577 0.245 27.325);
 61 |   --border: oklch(0.922 0 0);
 62 |   --input: oklch(0.922 0 0);
 63 |   --ring: oklch(0.708 0 0);
 64 |   --chart-1: oklch(0.646 0.222 41.116);
 65 |   --chart-2: oklch(0.6 0.118 184.704);
 66 |   --chart-3: oklch(0.398 0.07 227.392);
 67 |   --chart-4: oklch(0.828 0.189 84.429);
 68 |   --chart-5: oklch(0.769 0.188 70.08);
 69 |   --sidebar: oklch(0.985 0 0);
 70 |   --sidebar-foreground: oklch(0.145 0 0);
 71 |   --sidebar-primary: oklch(0.205 0 0);
 72 |   --sidebar-primary-foreground: oklch(0.985 0 0);
 73 |   --sidebar-accent: oklch(0.97 0 0);
 74 |   --sidebar-accent-foreground: oklch(0.205 0 0);
 75 |   --sidebar-border: oklch(0.922 0 0);
 76 |   --sidebar-ring: oklch(0.708 0 0);
 77 | }
 78 | 
 79 | .dark {
 80 |   --background: oklch(0.145 0 0);
 81 |   --foreground: oklch(0.985 0 0);
 82 |   --card: oklch(0.205 0 0);
 83 |   --card-foreground: oklch(0.985 0 0);
 84 |   --popover: oklch(0.205 0 0);
 85 |   --popover-foreground: oklch(0.985 0 0);
 86 |   --primary: oklch(0.922 0 0);
 87 |   --primary-foreground: oklch(0.205 0 0);
 88 |   --secondary: oklch(0.269 0 0);
 89 |   --secondary-foreground: oklch(0.985 0 0);
 90 |   --muted: oklch(0.269 0 0);
 91 |   --muted-foreground: oklch(0.708 0 0);
 92 |   --accent: oklch(0.269 0 0);
 93 |   --accent-foreground: oklch(0.985 0 0);
 94 |   --destructive: oklch(0.704 0.191 22.216);
 95 |   --border: oklch(1 0 0 / 10%);
 96 |   --input: oklch(1 0 0 / 15%);
 97 |   --ring: oklch(0.556 0 0);
 98 |   --chart-1: oklch(0.488 0.243 264.376);
 99 |   --chart-2: oklch(0.696 0.17 162.48);
100 |   --chart-3: oklch(0.769 0.188 70.08);
101 |   --chart-4: oklch(0.627 0.265 303.9);
102 |   --chart-5: oklch(0.645 0.246 16.439);
103 |   --sidebar: oklch(0.205 0 0);
104 |   --sidebar-foreground: oklch(0.985 0 0);
105 |   --sidebar-primary: oklch(0.488 0.243 264.376);
106 |   --sidebar-primary-foreground: oklch(0.985 0 0);
107 |   --sidebar-accent: oklch(0.269 0 0);
108 |   --sidebar-accent-foreground: oklch(0.985 0 0);
109 |   --sidebar-border: oklch(1 0 0 / 10%);
110 |   --sidebar-ring: oklch(0.556 0 0);
111 | }
112 | 
113 | @layer base {
114 |   * {
115 |     @apply border-border outline-ring/50;
116 |   }
117 |   body {
118 |     @apply bg-background text-foreground;
119 |   }
120 | }
121 | 


--------------------------------------------------------------------------------
/extension/src/components/ui/button.tsx:
--------------------------------------------------------------------------------
 1 | import * as React from "react";
 2 | import { Slot } from "@radix-ui/react-slot";
 3 | import { cva, type VariantProps } from "class-variance-authority";
 4 | 
 5 | import { cn } from "@/lib/utils";
 6 | 
 7 | const buttonVariants = cva(
 8 |   "inline-flex items-center justify-center gap-2 whitespace-nowrap rounded-md text-sm font-medium transition-all disabled:pointer-events-none disabled:opacity-50 [&_svg]:pointer-events-none [&_svg:not([class*='size-'])]:size-4 shrink-0 [&_svg]:shrink-0 outline-none focus-visible:border-ring focus-visible:ring-ring/50 focus-visible:ring-[3px] aria-invalid:ring-destructive/20 dark:aria-invalid:ring-destructive/40 aria-invalid:border-destructive",
 9 |   {
10 |     variants: {
11 |       variant: {
12 |         default:
13 |           "bg-primary text-primary-foreground shadow-xs hover:bg-primary/90",
14 |         destructive:
15 |           "bg-destructive text-white shadow-xs hover:bg-destructive/90 focus-visible:ring-destructive/20 dark:focus-visible:ring-destructive/40 dark:bg-destructive/60",
16 |         outline:
17 |           "border bg-background shadow-xs hover:bg-accent hover:text-accent-foreground dark:bg-input/30 dark:border-input dark:hover:bg-input/50",
18 |         secondary:
19 |           "bg-secondary text-secondary-foreground shadow-xs hover:bg-secondary/80",
20 |         ghost:
21 |           "hover:bg-accent hover:text-accent-foreground dark:hover:bg-accent/50",
22 |         link: "text-primary underline-offset-4 hover:underline",
23 |       },
24 |       size: {
25 |         default: "h-9 px-4 py-2 has-[>svg]:px-3",
26 |         sm: "h-8 rounded-md gap-1.5 px-3 has-[>svg]:px-2.5",
27 |         lg: "h-10 rounded-md px-6 has-[>svg]:px-4",
28 |         icon: "size-9",
29 |       },
30 |     },
31 |     defaultVariants: {
32 |       variant: "default",
33 |       size: "default",
34 |     },
35 |   }
36 | );
37 | 
38 | function Button({
39 |   className,
40 |   variant,
41 |   size,
42 |   asChild = false,
43 |   ...props
44 | }: React.ComponentProps<"button"> &
45 |   VariantProps<typeof buttonVariants> & {
46 |     asChild?: boolean;
47 |   }) {
48 |   const Comp = asChild ? Slot : "button";
49 | 
50 |   return (
51 |     <Comp
52 |       data-slot="button"
53 |       className={cn(buttonVariants({ variant, size, className }))}
54 |       {...props}
55 |     />
56 |   );
57 | }
58 | 
59 | export { Button, buttonVariants };
60 | 


--------------------------------------------------------------------------------
/extension/src/entrypoints/sidepanel/components/error-view.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import { useWorkflow } from "../context/workflow-provider";
 3 | import { Button } from "@/components/ui/button";
 4 | 
 5 | export const ErrorView: React.FC = () => {
 6 |   const { error, fetchWorkflowData, startRecording } = useWorkflow();
 7 | 
 8 |   const handleRetry = () => {
 9 |     // Try fetching data again
10 |     fetchWorkflowData();
11 |   };
12 | 
13 |   const handleStartNew = () => {
14 |     // Reset state and start recording
15 |     startRecording();
16 |   };
17 | 
18 |   return (
19 |     <div className="flex flex-col items-center justify-center h-full space-y-4 p-4 text-center">
20 |       <h2 className="text-lg font-semibold text-destructive">
21 |         An Error Occurred
22 |       </h2>
23 |       <p className="text-sm text-muted-foreground">
24 |         {error || "An unexpected error occurred."}
25 |       </p>
26 |       <div className="flex space-x-2">
27 |         <Button variant="outline" onClick={handleRetry}>
28 |           Retry Load
29 |         </Button>
30 |         <Button variant="secondary" onClick={handleStartNew}>
31 |           Start New Recording
32 |         </Button>
33 |       </div>
34 |     </div>
35 |   );
36 | };
37 | 


--------------------------------------------------------------------------------
/extension/src/entrypoints/sidepanel/components/event-viewer.tsx:
--------------------------------------------------------------------------------
  1 | import React, { useEffect, useRef } from "react";
  2 | import {
  3 |   ClickStep,
  4 |   InputStep,
  5 |   KeyPressStep,
  6 |   NavigationStep,
  7 |   ScrollStep,
  8 |   Step,
  9 | } from "../../../lib/workflow-types"; // Adjust path as needed
 10 | import { useWorkflow } from "../context/workflow-provider";
 11 | 
 12 | // Helper to get the specific screenshot for a step
 13 | const getScreenshot = (step: Step): string | undefined => {
 14 |   if ("screenshot" in step) {
 15 |     return step.screenshot;
 16 |   }
 17 |   return undefined;
 18 | };
 19 | 
 20 | // Component to render a single step as a card
 21 | const StepCard: React.FC<{
 22 |   step: Step;
 23 |   index: number;
 24 |   isSelected: boolean;
 25 |   onSelect: () => void;
 26 | }> = ({ step, index, isSelected, onSelect }) => {
 27 |   const screenshot = getScreenshot(step);
 28 |   const canShowScreenshot = ["click", "input", "key_press"].includes(step.type);
 29 | 
 30 |   // --- Step Summary Renderer (Top part of the card) ---
 31 |   const renderStepSummary = (step: Step) => {
 32 |     switch (step.type) {
 33 |       case "click": {
 34 |         const s = step as ClickStep;
 35 |         return (
 36 |           <div className="flex items-center space-x-2">
 37 |             <span className="text-lg">🖱️</span>
 38 |             <span className="truncate">
 39 |               Click on <strong>{s.elementTag}</strong>
 40 |               {s.elementText && `: "${s.elementText}"`}
 41 |             </span>
 42 |           </div>
 43 |         );
 44 |       }
 45 |       case "input": {
 46 |         const s = step as InputStep;
 47 |         return (
 48 |           <div className="flex items-center space-x-2">
 49 |             <span className="text-lg">⌨️</span>
 50 |             <span className="truncate">
 51 |               Input into <strong>{s.elementTag}</strong>: "{s.value}"
 52 |             </span>
 53 |           </div>
 54 |         );
 55 |       }
 56 |       case "key_press": {
 57 |         const s = step as KeyPressStep;
 58 |         return (
 59 |           <div className="flex items-center space-x-2">
 60 |             <span className="text-lg">🔑</span>
 61 |             <span className="truncate">
 62 |               Press <strong>{s.key}</strong> on {s.elementTag || "document"}
 63 |             </span>
 64 |           </div>
 65 |         );
 66 |       }
 67 |       case "navigation": {
 68 |         const s = step as NavigationStep;
 69 |         return (
 70 |           <div className="flex items-center space-x-2">
 71 |             <span className="text-lg">🧭</span>
 72 |             <span className="truncate">Navigate: {s.url}</span>
 73 |           </div>
 74 |         );
 75 |       }
 76 |       case "scroll": {
 77 |         const s = step as ScrollStep;
 78 |         return (
 79 |           <div className="flex items-center space-x-2">
 80 |             <span className="text-lg">↕️</span>
 81 |             <span className="truncate">
 82 |               Scroll to ({s.scrollX}, {s.scrollY})
 83 |             </span>
 84 |           </div>
 85 |         );
 86 |       }
 87 |       default:
 88 |         return <>{(step as any).type}</>; // Fallback
 89 |     }
 90 |   };
 91 | 
 92 |   // --- Step Detail Renderer (Collapsible section or part of card body) ---
 93 |   const renderStepDetailsContent = (step: Step) => {
 94 |     const baseInfo = (
 95 |       <>
 96 |         <p>
 97 |           <strong>Timestamp:</strong>{" "}
 98 |           {new Date(step.timestamp).toLocaleString()}
 99 |         </p>
100 |         {step.url && (
101 |           <p>
102 |             <strong>URL:</strong> {step.url}
103 |           </p>
104 |         )}
105 |         {/* Tab ID might be less relevant now, could remove */}
106 |         {/* <p><strong>Tab ID:</strong> {step.tabId}</p> */}
107 |       </>
108 |     );
109 | 
110 |     let specificInfo = null;
111 | 
112 |     switch (step.type) {
113 |       case "click":
114 |       case "input":
115 |       case "key_press": {
116 |         const s = step as ClickStep | InputStep | KeyPressStep; // Union type
117 |         specificInfo = (
118 |           <>
119 |             {(s as ClickStep | InputStep).frameUrl &&
120 |               (s as ClickStep | InputStep).frameUrl !== s.url && (
121 |                 <p>
122 |                   <strong>Frame URL:</strong>{" "}
123 |                   {(s as ClickStep | InputStep).frameUrl}
124 |                 </p>
125 |               )}
126 |             {s.xpath && (
127 |               <p>
128 |                 <strong>XPath:</strong> {s.xpath}
129 |               </p>
130 |             )}
131 |             {s.cssSelector && (
132 |               <p>
133 |                 <strong>CSS:</strong> {s.cssSelector}
134 |               </p>
135 |             )}
136 |             {s.elementTag && (
137 |               <p>
138 |                 <strong>Element:</strong> {s.elementTag}
139 |               </p>
140 |             )}
141 |             {(s as ClickStep).elementText && (
142 |               <p>
143 |                 <strong>Text:</strong> {(s as ClickStep).elementText}
144 |               </p>
145 |             )}
146 |             {(s as InputStep).value && (
147 |               <p>
148 |                 <strong>Value:</strong> {(s as InputStep).value}
149 |               </p>
150 |             )}
151 |             {(s as KeyPressStep).key && (
152 |               <p>
153 |                 <strong>Key:</strong> {(s as KeyPressStep).key}
154 |               </p>
155 |             )}
156 |           </>
157 |         );
158 |         break;
159 |       }
160 |       case "navigation": {
161 |         // Base info already has URL
162 |         break;
163 |       }
164 |       case "scroll": {
165 |         const s = step as ScrollStep;
166 |         specificInfo = (
167 |           <>
168 |             <p>
169 |               <strong>Target ID:</strong> {s.targetId}
170 |             </p>
171 |             <p>
172 |               <strong>Scroll X:</strong> {s.scrollX}
173 |             </p>
174 |             <p>
175 |               <strong>Scroll Y:</strong> {s.scrollY}
176 |             </p>
177 |           </>
178 |         );
179 |         break;
180 |       }
181 |       default:
182 |         specificInfo = (
183 |           <p>Details not available for type: {(step as any).type}</p>
184 |         );
185 |     }
186 | 
187 |     return (
188 |       <div className="text-[10px] text-muted-foreground break-all mt-2 space-y-1">
189 |         {baseInfo}
190 |         {specificInfo}
191 |       </div>
192 |     );
193 |   };
194 | 
195 |   return (
196 |     <div
197 |       id={`event-item-${index}`} // Keep ID for potential scrolling
198 |       onClick={onSelect}
199 |       className={` 
200 |         border rounded-lg mb-3 overflow-hidden cursor-pointer transition-all duration-150 ease-in-out 
201 |         ${
202 |           isSelected
203 |             ? "border-primary shadow-md scale-[1.01]"
204 |             : "border-border hover:border-muted-foreground/50 hover:shadow-sm"
205 |         } 
206 |       `}
207 |     >
208 |       {/* Card Content using Flexbox */}
209 |       <div className="flex items-start p-3 space-x-3">
210 |         {/* Left side: Summary and Details */}
211 |         <div className="flex-grow overflow-hidden">
212 |           <div className="text-sm font-medium mb-2">
213 |             {renderStepSummary(step)}
214 |           </div>
215 |           {renderStepDetailsContent(step)}
216 |         </div>
217 | 
218 |         {/* Right side: Screenshot (if available) */}
219 |         {canShowScreenshot && screenshot && (
220 |           <div className="flex-shrink-0 w-24 h-auto border border-border rounded overflow-hidden shadow-sm ml-auto">
221 |             <img
222 |               src={screenshot}
223 |               alt={`Screenshot for step ${index + 1}`}
224 |               className="block w-full h-full object-cover"
225 |               loading="lazy" // Lazy load screenshots further down
226 |             />
227 |           </div>
228 |         )}
229 |       </div>
230 |     </div>
231 |   );
232 | };
233 | 
234 | // Main EventViewer component using the new card layout
235 | export const EventViewer: React.FC = () => {
236 |   const { workflow, currentEventIndex, selectEvent, recordingStatus } =
237 |     useWorkflow();
238 |   const steps = workflow?.steps || [];
239 |   const scrollContainerRef = useRef<HTMLDivElement>(null); // Ref for the scrollable div
240 | 
241 |   // Effect to scroll selected card into view
242 |   useEffect(() => {
243 |     if (recordingStatus !== "recording") {
244 |       // Only scroll selection when not recording
245 |       const element = document.getElementById(
246 |         `event-item-${currentEventIndex}`
247 |       );
248 |       element?.scrollIntoView({ behavior: "smooth", block: "center" });
249 |     }
250 |   }, [currentEventIndex, recordingStatus]); // Add recordingStatus dependency
251 | 
252 |   // Effect to scroll to bottom when new steps are added during recording
253 |   useEffect(() => {
254 |     if (recordingStatus === "recording" && scrollContainerRef.current) {
255 |       const { current: container } = scrollContainerRef;
256 |       // Use setTimeout to allow DOM update before scrolling
257 |       setTimeout(() => {
258 |         container.scrollTop = container.scrollHeight;
259 |         console.log("Scrolled to bottom due to new event during recording");
260 |       }, 0);
261 |     }
262 |     // Depend on the number of steps and recording status
263 |   }, [steps.length, recordingStatus]);
264 | 
265 |   if (!workflow || !workflow.steps || workflow.steps.length === 0) {
266 |     return (
267 |       <div className="flex items-center justify-center h-full text-muted-foreground p-6">
268 |         No events recorded yet.
269 |       </div>
270 |     );
271 |   }
272 | 
273 |   return (
274 |     // Assign the ref to the scrollable container
275 |     <div ref={scrollContainerRef} className="h-full overflow-y-auto p-0.5">
276 |       {" "}
277 |       {/* Single scrollable container */}
278 |       {steps.map((step, index) => (
279 |         <StepCard
280 |           key={index}
281 |           step={step}
282 |           index={index}
283 |           isSelected={index === currentEventIndex}
284 |           onSelect={() => selectEvent(index)}
285 |         />
286 |       ))}
287 |     </div>
288 |   );
289 | };
290 | 


--------------------------------------------------------------------------------
/extension/src/entrypoints/sidepanel/components/initial-view.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import { useWorkflow } from "../context/workflow-provider";
 3 | import { Button } from "@/components/ui/button"; // Reverted to alias path
 4 | 
 5 | export const InitialView: React.FC = () => {
 6 |   const { startRecording } = useWorkflow();
 7 | 
 8 |   return (
 9 |     <div className="flex flex-col items-center justify-center h-full space-y-4">
10 |       <h2 className="text-lg font-semibold">Record a Workflow</h2>
11 | 
12 |       <Button onClick={startRecording}>Start Recording</Button>
13 |     </div>
14 |   );
15 | };
16 | 


--------------------------------------------------------------------------------
/extension/src/entrypoints/sidepanel/components/logina-view.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | 
 3 | // Simple loading spinner component
 4 | const Spinner: React.FC = () => (
 5 |   <svg
 6 |     className="animate-spin h-8 w-8 text-primary"
 7 |     xmlns="http://www.w3.org/2000/svg"
 8 |     fill="none"
 9 |     viewBox="0 0 24 24"
10 |   >
11 |     <circle
12 |       className="opacity-25"
13 |       cx="12"
14 |       cy="12"
15 |       r="10"
16 |       stroke="currentColor"
17 |       strokeWidth="4"
18 |     ></circle>
19 |     <path
20 |       className="opacity-75"
21 |       fill="currentColor"
22 |       d="M4 12a8 8 0 018-8V0C5.373 0 0 5.373 0 12h4zm2 5.291A7.962 7.962 0 014 12H0c0 3.042 1.135 5.824 3 7.938l3-2.647z"
23 |     ></path>
24 |   </svg>
25 | );
26 | 
27 | export const LoadingView: React.FC = () => {
28 |   return (
29 |     <div className="flex flex-col items-center justify-center h-full space-y-4">
30 |       <Spinner />
31 |       <p className="text-sm text-muted-foreground">Loading workflow data...</p>
32 |     </div>
33 |   );
34 | };
35 | 


--------------------------------------------------------------------------------
/extension/src/entrypoints/sidepanel/components/recording-view.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import { useWorkflow } from "../context/workflow-provider";
 3 | import { Button } from "@/components/ui/button";
 4 | import { EventViewer } from "./event-viewer"; // Import EventViewer
 5 | 
 6 | export const RecordingView: React.FC = () => {
 7 |   const { stopRecording, workflow } = useWorkflow();
 8 |   const stepCount = workflow?.steps?.length || 0;
 9 | 
10 |   return (
11 |     <div className="flex flex-col h-full">
12 |       <div className="flex items-center justify-between p-4 border-b border-border">
13 |         <div className="flex items-center space-x-2">
14 |           <span className="relative flex h-3 w-3">
15 |             <span className="animate-ping absolute inline-flex h-full w-full rounded-full bg-red-400 opacity-75"></span>
16 |             <span className="relative inline-flex rounded-full h-3 w-3 bg-red-500"></span>
17 |           </span>
18 |           <span className="text-sm font-medium">
19 |             Recording ({stepCount} steps)
20 |           </span>
21 |         </div>
22 |         <Button variant="destructive" size="sm" onClick={stopRecording}>
23 |           Stop Recording
24 |         </Button>
25 |       </div>
26 |       <div className="flex-grow overflow-hidden p-4">
27 |         {/* EventViewer will now take full available space within this div */}
28 |         <EventViewer />
29 |       </div>
30 |     </div>
31 |   );
32 | };
33 | 


--------------------------------------------------------------------------------
/extension/src/entrypoints/sidepanel/components/stopped-view.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import { useWorkflow } from "../context/workflow-provider";
 3 | import { Button } from "@/components/ui/button";
 4 | import { EventViewer } from "./event-viewer";
 5 | 
 6 | export const StoppedView: React.FC = () => {
 7 |   const { discardAndStartNew, workflow } = useWorkflow();
 8 | 
 9 |   const downloadJson = () => {
10 |     if (!workflow) return;
11 | 
12 |     // Sanitize workflow name for filename
13 |     const safeName = workflow.name
14 |       ? workflow.name.replace(/[^a-z0-9\.\-\_]/gi, "_").toLowerCase()
15 |       : "workflow";
16 | 
17 |     const blob = new Blob([JSON.stringify(workflow, null, 2)], {
18 |       type: "application/json",
19 |     });
20 |     const url = URL.createObjectURL(blob);
21 |     const a = document.createElement("a");
22 |     a.href = url;
23 |     // Generate filename e.g., my_workflow_name_2023-10-27_10-30-00.json
24 |     const timestamp = new Date()
25 |       .toISOString()
26 |       .replace(/[:.]/g, "-")
27 |       .slice(0, 19);
28 |     // Use sanitized name instead of domain
29 |     a.download = `${safeName}_${timestamp}.json`;
30 |     document.body.appendChild(a);
31 |     a.click();
32 |     document.body.removeChild(a);
33 |     URL.revokeObjectURL(url);
34 |   };
35 | 
36 |   return (
37 |     <div className="flex flex-col h-full">
38 |       <div className="flex items-center justify-between p-4 border-b border-border">
39 |         <h2 className="text-lg font-semibold">Recording Finished</h2>
40 |         <div className="space-x-2">
41 |           <Button variant="outline" size="sm" onClick={discardAndStartNew}>
42 |             Discard & Start New
43 |           </Button>
44 |           <Button
45 |             size="sm"
46 |             onClick={downloadJson}
47 |             disabled={
48 |               !workflow || !workflow.steps || workflow.steps.length === 0
49 |             }
50 |           >
51 |             Download JSON
52 |           </Button>
53 |         </div>
54 |       </div>
55 |       <div className="flex-grow overflow-hidden p-4">
56 |         <EventViewer />
57 |       </div>
58 |     </div>
59 |   );
60 | };
61 | 


--------------------------------------------------------------------------------
/extension/src/entrypoints/sidepanel/context/workflow-provider.tsx:
--------------------------------------------------------------------------------
  1 | import React, {
  2 |   createContext,
  3 |   ReactNode,
  4 |   useCallback,
  5 |   useContext,
  6 |   useEffect,
  7 |   useState,
  8 | } from "react";
  9 | import { Workflow } from "../../../lib/workflow-types"; // Adjust path as needed
 10 | 
 11 | type WorkflowState = {
 12 |   workflow: Workflow | null;
 13 |   recordingStatus: string; // e.g., 'idle', 'recording', 'stopped', 'error'
 14 |   currentEventIndex: number;
 15 |   isLoading: boolean;
 16 |   error: string | null;
 17 | };
 18 | 
 19 | type WorkflowContextType = WorkflowState & {
 20 |   startRecording: () => void;
 21 |   stopRecording: () => void;
 22 |   discardAndStartNew: () => void;
 23 |   selectEvent: (index: number) => void;
 24 |   fetchWorkflowData: (isPolling?: boolean) => void; // Add optional flag
 25 | };
 26 | 
 27 | const WorkflowContext = createContext<WorkflowContextType | undefined>(
 28 |   undefined
 29 | );
 30 | 
 31 | interface WorkflowProviderProps {
 32 |   children: ReactNode;
 33 | }
 34 | 
 35 | const POLLING_INTERVAL = 2000; // Fetch every 2 seconds during recording
 36 | 
 37 | export const WorkflowProvider: React.FC<WorkflowProviderProps> = ({
 38 |   children,
 39 | }) => {
 40 |   const [workflow, setWorkflow] = useState<Workflow | null>(null);
 41 |   const [recordingStatus, setRecordingStatus] = useState<string>("idle"); // 'idle', 'recording', 'stopped', 'error'
 42 |   const [currentEventIndex, setCurrentEventIndex] = useState<number>(0);
 43 |   const [isLoading, setIsLoading] = useState<boolean>(true);
 44 |   const [error, setError] = useState<string | null>(null);
 45 | 
 46 |   const fetchWorkflowData = useCallback(async (isPolling: boolean = false) => {
 47 |     if (!isPolling) {
 48 |       setIsLoading(true);
 49 |     }
 50 |     try {
 51 |       const data = await chrome.runtime.sendMessage({
 52 |         type: "GET_RECORDING_DATA",
 53 |       });
 54 |       console.log(
 55 |         "Received workflow data from background (polling=" + isPolling + "):",
 56 |         data
 57 |       );
 58 |       if (data && data.workflow && data.recordingStatus) {
 59 |         // Always update workflow when fetching (polling or not)
 60 |         setWorkflow(data.workflow);
 61 | 
 62 |         // If NOT polling, update status and index based on fetched data
 63 |         // If polling, we primarily rely on the broadcast message for status changes
 64 |         if (!isPolling) {
 65 |           setRecordingStatus(data.recordingStatus);
 66 |           setCurrentEventIndex(
 67 |             data.workflow.steps ? data.workflow.steps.length - 1 : 0
 68 |           );
 69 |         } else {
 70 |           // If polling, ensure index is valid (e.g., after step deletion)
 71 |           // Only adjust index based on current workflow state from polling
 72 |           setCurrentEventIndex((prevIndex) =>
 73 |             Math.min(prevIndex, (data.workflow.steps?.length || 1) - 1)
 74 |           );
 75 |           // Do NOT set recordingStatus from polling fetch, wait for broadcast message
 76 |         }
 77 |         // Clear error on successful fetch
 78 |         setError(null);
 79 |       } else {
 80 |         console.warn(
 81 |           "Received invalid/incomplete data structure from GET_RECORDING_DATA"
 82 |         );
 83 |         if (!isPolling) {
 84 |           setWorkflow(null);
 85 |           setRecordingStatus("idle");
 86 |           setCurrentEventIndex(0);
 87 |         }
 88 |       }
 89 |     } catch (err: any) {
 90 |       console.error(
 91 |         "Error fetching workflow data (polling=" + isPolling + "):",
 92 |         err
 93 |       );
 94 |       // Only set error state if it wasn't a background poll error
 95 |       // and the status isn't already error
 96 |       if (!isPolling) {
 97 |         setError(`Failed to load workflow data: ${err.message}`);
 98 |         setRecordingStatus("error");
 99 |         setWorkflow(null);
100 |       }
101 |     } finally {
102 |       if (!isPolling) {
103 |         setIsLoading(false);
104 |       }
105 |     }
106 |     // Remove state dependencies to stabilize the function reference
107 |   }, []);
108 | 
109 |   useEffect(() => {
110 |     // Initial fetch on mount
111 |     fetchWorkflowData(false);
112 | 
113 |     // Listener for status updates pushed from the background script
114 |     const messageListener = (message: any, sender: any, sendResponse: any) => {
115 |       console.log("Sidepanel received message:", message);
116 |       if (message.type === "recording_status_updated") {
117 |         console.log(
118 |           "Recording status updated message received:",
119 |           message.payload
120 |         );
121 |         const newStatus = message.payload.status;
122 |         // Use functional update to get previous status reliably
123 |         setRecordingStatus((prevStatus) => {
124 |           // If status changed from non-stopped/idle to stopped or idle, fetch final data
125 |           if (
126 |             newStatus !== prevStatus &&
127 |             (newStatus === "stopped" || newStatus === "idle")
128 |           ) {
129 |             fetchWorkflowData(false); // Fetch final data, show loading
130 |           }
131 |           return newStatus; // Return the new status to update the state
132 |         });
133 |       }
134 |     };
135 |     chrome.runtime.onMessage.addListener(messageListener);
136 | 
137 |     // --- Polling Logic ---
138 |     let pollingIntervalId: NodeJS.Timeout | null = null;
139 |     if (recordingStatus === "recording") {
140 |       pollingIntervalId = setInterval(() => {
141 |         fetchWorkflowData(true); // Fetch updates in the background (polling)
142 |       }, POLLING_INTERVAL);
143 |       console.log(`Polling started (Interval ID: ${pollingIntervalId})`);
144 |     }
145 |     // --- End Polling Logic ---
146 | 
147 |     // Cleanup listener and interval
148 |     return () => {
149 |       chrome.runtime.onMessage.removeListener(messageListener);
150 |       if (pollingIntervalId) {
151 |         clearInterval(pollingIntervalId);
152 |         console.log(
153 |           `Polling stopped (Cleared Interval ID: ${pollingIntervalId})`
154 |         );
155 |       }
156 |     };
157 |     // Keep dependencies: fetchWorkflowData is stable now,
158 |     // recordingStatus dependency correctly handles interval setup/teardown.
159 |   }, [fetchWorkflowData, recordingStatus]);
160 | 
161 |   // startRecording, stopRecording, discardAndStartNew, selectEvent remain largely the same
162 |   // but ensure isLoading is handled appropriately
163 |   const startRecording = useCallback(() => {
164 |     setError(null);
165 |     setIsLoading(true);
166 |     chrome.runtime.sendMessage({ type: "START_RECORDING" }, (response) => {
167 |       // Loading state will be turned off by the fetchWorkflowData triggered
168 |       // by the recording_status_updated message, or on error here.
169 |       if (chrome.runtime.lastError) {
170 |         console.error("Error starting recording:", chrome.runtime.lastError);
171 |         setError(
172 |           `Failed to start recording: ${chrome.runtime.lastError.message}`
173 |         );
174 |         setRecordingStatus("error");
175 |         setIsLoading(false); // Stop loading on error
176 |       } else {
177 |         console.log("Start recording acknowledged by background.");
178 |         // State updates happen via broadcast + fetch
179 |       }
180 |     });
181 |   }, []); // No dependencies needed
182 | 
183 |   const stopRecording = useCallback(() => {
184 |     setError(null);
185 |     setIsLoading(true);
186 |     chrome.runtime.sendMessage({ type: "STOP_RECORDING" }, (response) => {
187 |       // Loading state will be turned off by the fetchWorkflowData triggered
188 |       // by the recording_status_updated message, or on error here.
189 |       if (chrome.runtime.lastError) {
190 |         console.error("Error stopping recording:", chrome.runtime.lastError);
191 |         setError(
192 |           `Failed to stop recording: ${chrome.runtime.lastError.message}`
193 |         );
194 |         setRecordingStatus("error");
195 |         setIsLoading(false); // Stop loading on error
196 |       } else {
197 |         console.log("Stop recording acknowledged by background.");
198 |         // State updates happen via broadcast + fetch
199 |       }
200 |     });
201 |   }, []); // No dependencies needed
202 | 
203 |   const discardAndStartNew = useCallback(() => {
204 |     startRecording();
205 |   }, [startRecording]);
206 | 
207 |   const selectEvent = useCallback((index: number) => {
208 |     setCurrentEventIndex(index);
209 |   }, []);
210 | 
211 |   const value = {
212 |     workflow,
213 |     recordingStatus,
214 |     currentEventIndex,
215 |     isLoading,
216 |     error,
217 |     startRecording,
218 |     stopRecording,
219 |     discardAndStartNew,
220 |     selectEvent,
221 |     fetchWorkflowData,
222 |   };
223 | 
224 |   return (
225 |     <WorkflowContext.Provider value={value}>
226 |       {children}
227 |     </WorkflowContext.Provider>
228 |   );
229 | };
230 | 
231 | export const useWorkflow = (): WorkflowContextType => {
232 |   const context = useContext(WorkflowContext);
233 |   if (context === undefined) {
234 |     throw new Error("useWorkflow must be used within a WorkflowProvider");
235 |   }
236 |   return context;
237 | };
238 | 


--------------------------------------------------------------------------------
/extension/src/entrypoints/sidepanel/index.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | <html lang="en">
 3 |   <head>
 4 |     <meta charset="UTF-8" />
 5 |     <meta name="viewport" content="width=device-width, initial-scale=1.0" />
 6 |     <title>Default Popup Title</title>
 7 |     <meta name="manifest.type" content="browser_action" />
 8 | 
 9 |     <!-- Customize the manifest options -->
10 |     <meta name="manifest.open_at_install" content="true" />
11 |     <!-- <meta name="manifest.browser_style" content="true|false" /> -->
12 |   </head>
13 |   <body>
14 |     <div id="root"></div>
15 |     <script type="module" src="./index.tsx"></script>
16 |   </body>
17 | </html>
18 | 


--------------------------------------------------------------------------------
/extension/src/entrypoints/sidepanel/index.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import ReactDOM from "react-dom/client";
 3 | 
 4 | // import vite tailwind css
 5 | import "@/assets/tailwind.css";
 6 | 
 7 | import { ErrorView } from "./components/error-view";
 8 | import { InitialView } from "./components/initial-view";
 9 | import { LoadingView } from "./components/logina-view";
10 | import { RecordingView } from "./components/recording-view";
11 | import { StoppedView } from "./components/stopped-view";
12 | import { WorkflowProvider, useWorkflow } from "./context/workflow-provider";
13 | 
14 | const AppContent: React.FC = () => {
15 |   const { recordingStatus, isLoading, error } = useWorkflow();
16 | 
17 |   if (isLoading) {
18 |     return <LoadingView />;
19 |   }
20 | 
21 |   if (error) {
22 |     return <ErrorView />;
23 |   }
24 | 
25 |   switch (recordingStatus) {
26 |     case "recording":
27 |       return <RecordingView />;
28 |     case "stopped":
29 |       return <StoppedView />;
30 |     case "idle":
31 |     default:
32 |       return <InitialView />;
33 |   }
34 | };
35 | 
36 | const SidepanelApp: React.FC = () => {
37 |   return (
38 |     <React.StrictMode>
39 |       <WorkflowProvider>
40 |         <div className="h-screen flex flex-col">
41 |           <main className="flex-grow overflow-auto">
42 |             <AppContent />
43 |           </main>
44 |         </div>
45 |       </WorkflowProvider>
46 |     </React.StrictMode>
47 |   );
48 | };
49 | 
50 | const rootElement = document.getElementById("root");
51 | if (!rootElement) {
52 |   throw new Error("Root element not found");
53 | }
54 | 
55 | const root = ReactDOM.createRoot(rootElement);
56 | root.render(<SidepanelApp />);
57 | 


--------------------------------------------------------------------------------
/extension/src/lib/message-bus-types.ts:
--------------------------------------------------------------------------------
 1 | import { Workflow } from "./workflow-types"; // Assuming Workflow is in this path
 2 | 
 3 | // Types for events sent via HTTP to the Python server
 4 | 
 5 | export interface HttpWorkflowUpdateEvent {
 6 |   type: "WORKFLOW_UPDATE";
 7 |   timestamp: number;
 8 |   payload: Workflow;
 9 | }
10 | 
11 | export interface HttpRecordingStartedEvent {
12 |   type: "RECORDING_STARTED";
13 |   timestamp: number;
14 |   payload: {
15 |     message: string;
16 |   };
17 | }
18 | 
19 | export interface HttpRecordingStoppedEvent {
20 |   type: "RECORDING_STOPPED";
21 |   timestamp: number;
22 |   payload: {
23 |     message: string;
24 |   };
25 | }
26 | 
27 | // If you plan to send other types of events, like TERMINATE_COMMAND, define them here too
28 | // export interface HttpTerminateCommandEvent {
29 | //   type: "TERMINATE_COMMAND";
30 | //   timestamp: number;
31 | //   payload: {
32 | //     reason?: string; // Optional reason for termination
33 | //   };
34 | // }
35 | 
36 | export type HttpEvent =
37 |   | HttpWorkflowUpdateEvent
38 |   | HttpRecordingStartedEvent
39 |   | HttpRecordingStoppedEvent;
40 | // | HttpTerminateCommandEvent; // Add other event types to the union if defined
41 | 


--------------------------------------------------------------------------------
/extension/src/lib/types.ts:
--------------------------------------------------------------------------------
 1 | export interface StoredCustomClickEvent {
 2 |   timestamp: number;
 3 |   url: string;
 4 |   frameUrl: string;
 5 |   xpath: string;
 6 |   cssSelector?: string;
 7 |   elementTag: string;
 8 |   elementText: string;
 9 |   tabId: number;
10 |   messageType: "CUSTOM_CLICK_EVENT";
11 |   screenshot?: string;
12 | }
13 | 
14 | export interface StoredCustomInputEvent {
15 |   timestamp: number;
16 |   url: string;
17 |   frameUrl: string;
18 |   xpath: string;
19 |   cssSelector?: string;
20 |   elementTag: string;
21 |   value: string;
22 |   tabId: number;
23 |   messageType: "CUSTOM_INPUT_EVENT";
24 |   screenshot?: string;
25 | }
26 | 
27 | export interface StoredCustomSelectEvent {
28 |   timestamp: number;
29 |   url: string;
30 |   frameUrl: string;
31 |   xpath: string;
32 |   cssSelector?: string;
33 |   elementTag: string;
34 |   selectedValue: string;
35 |   selectedText: string;
36 |   tabId: number;
37 |   messageType: "CUSTOM_SELECT_EVENT";
38 |   screenshot?: string;
39 | }
40 | 
41 | export interface StoredCustomKeyEvent {
42 |   timestamp: number;
43 |   url: string;
44 |   frameUrl: string;
45 |   key: string;
46 |   xpath?: string; // XPath of focused element
47 |   cssSelector?: string;
48 |   elementTag?: string;
49 |   tabId: number;
50 |   messageType: "CUSTOM_KEY_EVENT";
51 |   screenshot?: string;
52 | }
53 | 
54 | export interface StoredTabEvent {
55 |   timestamp: number;
56 |   tabId: number;
57 |   messageType:
58 |     | "CUSTOM_TAB_CREATED"
59 |     | "CUSTOM_TAB_UPDATED"
60 |     | "CUSTOM_TAB_ACTIVATED"
61 |     | "CUSTOM_TAB_REMOVED";
62 |   url?: string;
63 |   openerTabId?: number;
64 |   windowId?: number;
65 |   changeInfo?: chrome.tabs.TabChangeInfo; // Relies on chrome types
66 |   isWindowClosing?: boolean;
67 |   index?: number;
68 |   title?: string;
69 | }
70 | 
71 | export interface StoredRrwebEvent {
72 |   type: number; // rrweb EventType (consider importing if needed)
73 |   data: any;
74 |   timestamp: number;
75 |   tabId: number;
76 |   messageType: "RRWEB_EVENT";
77 | }
78 | 
79 | export type StoredEvent =
80 |   | StoredCustomClickEvent
81 |   | StoredCustomInputEvent
82 |   | StoredCustomSelectEvent
83 |   | StoredCustomKeyEvent
84 |   | StoredTabEvent
85 |   | StoredRrwebEvent;
86 | 
87 | // --- Data Structures ---
88 | 
89 | export interface TabData {
90 |   info: { url?: string; title?: string };
91 |   events: StoredEvent[];
92 | }
93 | 
94 | export interface RecordingData {
95 |   [tabId: number]: TabData;
96 | }
97 | 


--------------------------------------------------------------------------------
/extension/src/lib/utils.ts:
--------------------------------------------------------------------------------
1 | import { clsx, type ClassValue } from "clsx"
2 | import { twMerge } from "tailwind-merge"
3 | 
4 | export function cn(...inputs: ClassValue[]) {
5 |   return twMerge(clsx(inputs))
6 | }
7 | 


--------------------------------------------------------------------------------
/extension/src/lib/workflow-types.ts:
--------------------------------------------------------------------------------
 1 | // --- Workflow Format ---
 2 | 
 3 | export interface Workflow {
 4 |   steps: Step[];
 5 |   name: string; // Consider how to populate these fields
 6 |   description: string; // Consider how to populate these fields
 7 |   version: string; // Consider how to populate these fields
 8 |   input_schema: [];
 9 | }
10 | 
11 | export type Step =
12 |   | NavigationStep
13 |   | ClickStep
14 |   | InputStep
15 |   | KeyPressStep
16 |   | ScrollStep;
17 | // Add other step types here as needed, e.g., SelectStep, TabCreatedStep etc.
18 | 
19 | export interface BaseStep {
20 |   type: string;
21 |   timestamp: number;
22 |   tabId: number;
23 |   url?: string; // Made optional as not all original events have it directly
24 | }
25 | 
26 | export interface NavigationStep extends BaseStep {
27 |   type: "navigation";
28 |   url: string; // Navigation implies a URL change
29 |   screenshot?: string; // Optional in source
30 | }
31 | 
32 | export interface ClickStep extends BaseStep {
33 |   type: "click";
34 |   url: string;
35 |   frameUrl: string;
36 |   xpath: string;
37 |   cssSelector?: string; // Optional in source
38 |   elementTag: string;
39 |   elementText: string;
40 |   screenshot?: string; // Optional in source
41 | }
42 | 
43 | export interface InputStep extends BaseStep {
44 |   type: "input";
45 |   url: string;
46 |   frameUrl: string;
47 |   xpath: string;
48 |   cssSelector?: string; // Optional in source
49 |   elementTag: string;
50 |   value: string;
51 |   screenshot?: string; // Optional in source
52 | }
53 | 
54 | export interface KeyPressStep extends BaseStep {
55 |   type: "key_press";
56 |   url?: string; // Can be missing if key press happens without element focus? Source is optional.
57 |   frameUrl?: string; // Might be missing
58 |   key: string;
59 |   xpath?: string; // Optional in source
60 |   cssSelector?: string; // Optional in source
61 |   elementTag?: string; // Optional in source
62 |   screenshot?: string; // Optional in source
63 | }
64 | 
65 | export interface ScrollStep extends BaseStep {
66 |   type: "scroll"; // Changed from scroll_update for simplicity
67 |   targetId: number; // The rrweb ID of the element being scrolled
68 |   scrollX: number;
69 |   scrollY: number;
70 |   // Note: url might be missing if scroll happens on initial load before meta event?
71 | }
72 | 
73 | // Potential future step types based on StoredEvent
74 | // export interface SelectStep extends BaseStep { ... }
75 | // export interface TabCreatedStep extends BaseStep { ... }
76 | // export interface TabActivatedStep extends BaseStep { ... }
77 | // export interface TabRemovedStep extends BaseStep { ... }
78 | 


--------------------------------------------------------------------------------
/extension/src/public/icon/128.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/browser-use/workflow-use/fc823f70f1996c12f18a818a9676aac674daa154/extension/src/public/icon/128.png


--------------------------------------------------------------------------------
/extension/src/public/icon/16.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/browser-use/workflow-use/fc823f70f1996c12f18a818a9676aac674daa154/extension/src/public/icon/16.png


--------------------------------------------------------------------------------
/extension/src/public/icon/32.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/browser-use/workflow-use/fc823f70f1996c12f18a818a9676aac674daa154/extension/src/public/icon/32.png


--------------------------------------------------------------------------------
/extension/src/public/icon/48.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/browser-use/workflow-use/fc823f70f1996c12f18a818a9676aac674daa154/extension/src/public/icon/48.png


--------------------------------------------------------------------------------
/extension/src/public/wxt.svg:
--------------------------------------------------------------------------------
 1 | <svg width="72" height="72" viewBox="0 0 72 72" fill="none" xmlns="http://www.w3.org/2000/svg">
 2 | <g clip-path="url(#clip0_305_516)">
 3 | <g clip-path="url(#clip1_305_516)">
 4 | <path d="M49.0229 69.1875C54.1272 69.1875 58.265 65.0497 58.265 59.9454V50.7033H59.9454C65.0497 50.7033 69.1875 46.5655 69.1875 41.4612C69.1875 36.357 65.0497 32.2191 59.9454 32.2191H58.265V22.9771C58.265 17.8728 54.1272 13.735 49.0229 13.735H39.7809V12.0546C39.7809 6.95032 35.643 2.8125 30.5388 2.8125C25.4345 2.8125 21.2967 6.95032 21.2967 12.0546V13.735H12.0546C6.95032 13.735 2.8125 17.8728 2.8125 22.9771V32.2191H4.49288C9.59714 32.2191 13.735 36.357 13.735 41.4612C13.735 46.5655 9.59714 50.7033 4.49288 50.7033H2.8125V69.1875H21.2967V67.5071C21.2967 62.4029 25.4345 58.265 30.5388 58.265C35.643 58.265 39.7809 62.4029 39.7809 67.5071V69.1875H49.0229Z" stroke="#67D55E" stroke-width="5.625"/>
 5 | </g>
 6 | </g>
 7 | <defs>
 8 | <clipPath id="clip0_305_516">
 9 | <rect width="72" height="72" fill="white"/>
10 | </clipPath>
11 | <clipPath id="clip1_305_516">
12 | <rect width="72" height="72" fill="white"/>
13 | </clipPath>
14 | </defs>
15 | </svg>
16 | 


--------------------------------------------------------------------------------
/extension/tsconfig.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "extends": "./.wxt/tsconfig.json",
 3 |   "compilerOptions": {
 4 |     "allowImportingTsExtensions": true,
 5 |     "jsx": "react-jsx",
 6 |     "baseUrl": ".",
 7 |     "paths": {
 8 |       "@/*": [
 9 |         "./src/*"
10 |       ]
11 |     }
12 |   }
13 | }


--------------------------------------------------------------------------------
/extension/vite.config.ts:
--------------------------------------------------------------------------------
 1 | // vite.config.ts
 2 | import { defineConfig } from "vite";
 3 | import path from "path";
 4 | import tailwindcss from "@tailwindcss/vite";
 5 | 
 6 | export default defineConfig({
 7 |   plugins: [tailwindcss()],
 8 |   resolve: {
 9 |     alias: {
10 |       "@": path.resolve(__dirname, "./src/"),
11 |     },
12 |   },
13 | });
14 | 


--------------------------------------------------------------------------------
/extension/wxt.config.ts:
--------------------------------------------------------------------------------
 1 | // wxt.config.ts
 2 | import { defineConfig } from "wxt";
 3 | import baseViteConfig from "./vite.config";
 4 | 
 5 | import { mergeConfig } from "vite";
 6 | 
 7 | // See https://wxt.dev/api/config.html
 8 | export default defineConfig({
 9 |   modules: ["@wxt-dev/module-react"],
10 |   srcDir: "src",
11 |   vite: () =>
12 |     mergeConfig(baseViteConfig, {
13 |       // WXT-specific overrides (optional)
14 |     }),
15 |   manifest: {
16 |     permissions: ["tabs", "sidePanel", "<all_urls>"],
17 |     host_permissions: ["http://127.0.0.1/*"],
18 |     // options_page: "options.html",
19 |     // action: {
20 |     //   default_popup: "popup.html",
21 |     // },
22 |   },
23 | });
24 | 


--------------------------------------------------------------------------------
/static/workflow-use.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/browser-use/workflow-use/fc823f70f1996c12f18a818a9676aac674daa154/static/workflow-use.png


--------------------------------------------------------------------------------
/ui/.eslintrc.cjs:
--------------------------------------------------------------------------------
 1 | module.exports = {
 2 |   root: true,
 3 |   env: { browser: true, es2020: true },
 4 |   extends: [
 5 |     'eslint:recommended',
 6 |     'plugin:@typescript-eslint/recommended',
 7 |     'plugin:react-hooks/recommended',
 8 |   ],
 9 |   ignorePatterns: ['dist', '.eslintrc.cjs'],
10 |   parser: '@typescript-eslint/parser',
11 |   plugins: ['react-refresh'],
12 |   rules: {
13 |     'react-refresh/only-export-components': [
14 |       'warn',
15 |       { allowConstantExport: true },
16 |     ],
17 |   },
18 | }
19 | 


--------------------------------------------------------------------------------
/ui/.github/dependabot.yml:
--------------------------------------------------------------------------------
 1 | # docs:
 2 | # https://docs.github.com/code-security/dependabot/dependabot-version-updates/configuration-options-for-the-dependabot.yml-file
 3 | 
 4 | version: 2
 5 | updates:
 6 |   - package-ecosystem: 'npm'
 7 |     directory: '/'
 8 |     schedule:
 9 |       interval: 'daily'
10 |     allow:
11 |       - dependency-name: '@xyflow/react'
12 | 


--------------------------------------------------------------------------------
/ui/.gitignore:
--------------------------------------------------------------------------------
 1 | # Logs
 2 | logs
 3 | *.log
 4 | npm-debug.log*
 5 | yarn-debug.log*
 6 | yarn-error.log*
 7 | pnpm-debug.log*
 8 | lerna-debug.log*
 9 | 
10 | node_modules
11 | dist
12 | dist-ssr
13 | *.local
14 | 
15 | # Editor directories and files
16 | .vscode/*
17 | !.vscode/extensions.json
18 | .idea
19 | .DS_Store
20 | *.suo
21 | *.ntvs*
22 | *.njsproj
23 | *.sln
24 | *.sw?
25 | 
26 | src/lib/api/apigen.d.ts
27 | 


--------------------------------------------------------------------------------
/ui/index.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | <html lang="en">
 3 |   <head>
 4 |     <meta charset="UTF-8" />
 5 |     <link rel="icon" href="/browseruse.png" />
 6 |     <meta name="viewport" content="width=device-width, initial-scale=1.0" />
 7 |     <title>Browser Use Workflow Visualizer</title>
 8 |   </head>
 9 |   <body>
10 |     <div id="root"></div>
11 |     <script type="module" src="/src/main.tsx"></script>
12 |   </body>
13 | </html>
14 | 


--------------------------------------------------------------------------------
/ui/package.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "name": "workflow-use-ui",
 3 |   "version": "0.0.0",
 4 |   "type": "module",
 5 |   "scripts": {
 6 |     "dev": "vite",
 7 |     "build": "tsc && vite build",
 8 |     "lint": "eslint . --ext ts,tsx --report-unused-disable-directives --max-warnings 0",
 9 |     "preview": "vite preview",
10 |     "get-openapi": "curl http://localhost:${BACKEND_PORT:-8000}/openapi.json -o ./src/lib/api/openapi.json",
11 |     "type-gen": "npx openapi-typescript ./src/lib/api/openapi.json -o ./src/lib/api/apigen.d.ts",
12 |     "type-gen-update": "rm -rf ./src/lib/api/apigen.d.ts && npm run get-openapi && npm run type-gen",
13 |     "postinstall": "test -n \"$NOYARNPOSTINSTALL\" || npm run type-gen"
14 |   },
15 |   "dependencies": {
16 |     "@tailwindcss/vite": "^4.1.7",
17 |     "@xyflow/react": "^12.5.1",
18 |     "openapi-fetch": "^0.14.0",
19 |     "openapi-react-query": "^0.5.0",
20 |     "react": "^18.2.0",
21 |     "react-dom": "^18.2.0",
22 |     "tailwindcss": "^4.1.7",
23 |     "zod": "^3.24.4"
24 |   },
25 |   "devDependencies": {
26 |     "@types/node": "^22.15.19",
27 |     "@types/react": "^18.2.53",
28 |     "@types/react-dom": "^18.2.18",
29 |     "@typescript-eslint/eslint-plugin": "^6.20.0",
30 |     "@typescript-eslint/parser": "^6.20.0",
31 |     "@vitejs/plugin-react": "^4.2.1",
32 |     "eslint": "^8.56.0",
33 |     "eslint-plugin-react-hooks": "^4.6.0",
34 |     "eslint-plugin-react-refresh": "^0.4.5",
35 |     "openapi-typescript": "^7.8.0",
36 |     "typescript": "^5.3.3",
37 |     "vite": "^5.0.12"
38 |   }
39 | }
40 | 


--------------------------------------------------------------------------------
/ui/public/browseruse.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/browser-use/workflow-use/fc823f70f1996c12f18a818a9676aac674daa154/ui/public/browseruse.png


--------------------------------------------------------------------------------
/ui/public/favicon.ico:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/browser-use/workflow-use/fc823f70f1996c12f18a818a9676aac674daa154/ui/public/favicon.ico


--------------------------------------------------------------------------------
/ui/src/App.tsx:
--------------------------------------------------------------------------------
 1 | import { ReactFlowProvider } from "@xyflow/react";
 2 | import "@xyflow/react/dist/style.css";
 3 | import WorkflowLayout from "./components/workflow-layout";
 4 | import { QueryClient, QueryClientProvider } from "@tanstack/react-query";
 5 | 
 6 | // Create a client
 7 | const queryClient = new QueryClient();
 8 | 
 9 | export default function App() {
10 |   return (
11 |     <QueryClientProvider client={queryClient}>
12 |       <ReactFlowProvider>
13 |         <WorkflowLayout />
14 |       </ReactFlowProvider>
15 |     </QueryClientProvider>
16 |   );
17 | }
18 | 


--------------------------------------------------------------------------------
/ui/src/components/log-viewer.tsx:
--------------------------------------------------------------------------------
  1 | import React, { useState, useEffect, useRef } from "react";
  2 | import { LogViewerProps } from "../types/log-viewer.types";
  3 | 
  4 | const LogViewer: React.FC<LogViewerProps> = ({
  5 |   taskId,
  6 |   initialPosition,
  7 |   onStatusChange,
  8 |   onError,
  9 |   onCancel,
 10 |   onClose,
 11 | }) => {
 12 |   const [isCancelling, setIsCancelling] = useState<boolean>(false);
 13 |   const [logs, setLogs] = useState<string[]>([]);
 14 |   const [position, setPosition] = useState<number>(initialPosition);
 15 |   const [status, setStatus] = useState<string>("running");
 16 |   const [error, setError] = useState<string | null>(null);
 17 |   const [polling, setPolling] = useState<boolean>(true);
 18 | 
 19 |   const logContainerRef = useRef<HTMLDivElement>(null);
 20 |   const pollingIntervalRef = useRef<NodeJS.Timeout | null>(null);
 21 | 
 22 |   useEffect(() => {
 23 |     if (logContainerRef.current) {
 24 |       logContainerRef.current.scrollTop = logContainerRef.current.scrollHeight;
 25 |     }
 26 |   }, [logs]);
 27 | 
 28 |   useEffect(() => {
 29 |     return () => {
 30 |       setPolling(false);
 31 |     };
 32 |   }, []);
 33 | 
 34 |   useEffect(() => {
 35 |     if (!taskId) return;
 36 | 
 37 |     const pollLogs = async () => {
 38 |       try {
 39 |         const response = await fetch(
 40 |           `http://127.0.0.1:8000/api/workflows/logs/${taskId}?position=${position}`
 41 |         );
 42 | 
 43 |         if (!response.ok) {
 44 |           throw new Error(`Error fetching logs: ${response.status}`);
 45 |         }
 46 | 
 47 |         const data = await response.json();
 48 | 
 49 |         if (data.logs && data.logs.length > 0) {
 50 |           setLogs((prevLogs) => [...prevLogs, ...data.logs]);
 51 |         }
 52 | 
 53 |         setPosition(data.log_position);
 54 | 
 55 |         if (data.status && data.status !== status) {
 56 |           setStatus(data.status);
 57 |           onStatusChange?.(data.status);
 58 | 
 59 |           if (data.status === "failed" && data.error) {
 60 |             setError(data.error);
 61 |             onError?.(data.error);
 62 |           }
 63 |         }
 64 |       } catch (err) {
 65 |         console.error("Error polling logs:", err);
 66 |       }
 67 |     };
 68 | 
 69 |     pollLogs();
 70 | 
 71 |     pollingIntervalRef.current = setInterval(() => {
 72 |       if (polling) {
 73 |         pollLogs();
 74 |       }
 75 |     }, 2000);
 76 | 
 77 |     return () => {
 78 |       if (pollingIntervalRef.current) {
 79 |         clearInterval(pollingIntervalRef.current);
 80 |       }
 81 |     };
 82 |   }, [taskId, position, status, polling, onStatusChange, onError]);
 83 | 
 84 |   const cancelWorkflow = async () => {
 85 |     if (!taskId || isCancelling || status !== "running") return;
 86 | 
 87 |     setIsCancelling(true);
 88 | 
 89 |     try {
 90 |       const response = await fetch(
 91 |         `http://127.0.0.1:8000/api/workflows/tasks/${taskId}/cancel`,
 92 |         {
 93 |           method: "POST",
 94 |           headers: {
 95 |             "Content-Type": "application/json",
 96 |           },
 97 |         }
 98 |       );
 99 | 
100 |       const data = await response.json();
101 | 
102 |       if (response.ok && data.success) {
103 |         // The status will be updated through the polling mechanism
104 |         if (onCancel) {
105 |           onCancel();
106 |         }
107 |       } else {
108 |         console.error(
109 |           "Failed to cancel workflow:",
110 |           data.message || "Unknown error"
111 |         );
112 |       }
113 |     } catch (err) {
114 |       console.error("Error cancelling workflow:", err);
115 |     } finally {
116 |       setIsCancelling(false);
117 |     }
118 |   };
119 | 
120 |   const downloadLogs = () => {
121 |     if (logs.length === 0) return;
122 | 
123 |     const textContent = logs.join("");
124 | 
125 |     const blob = new Blob([textContent], { type: "text/plain" });
126 | 
127 |     const url = URL.createObjectURL(blob);
128 | 
129 |     const link = document.createElement("a");
130 |     link.href = url;
131 |     link.download = taskId
132 |       ? `workflow-logs-${taskId}.txt`
133 |       : "workflow-logs.txt";
134 | 
135 |     document.body.appendChild(link);
136 |     link.click();
137 |     document.body.removeChild(link);
138 | 
139 |     URL.revokeObjectURL(url);
140 |   };
141 | 
142 |   const formatLog = (log: string, index: number) => {
143 |     const timestampMatch = log.match(/^\[(.*?)\]/);
144 | 
145 |     if (timestampMatch) {
146 |       const timestamp = timestampMatch[0];
147 |       const message = log.substring(timestamp.length);
148 | 
149 |       return (
150 |         <div key={index} className="log-line">
151 |           <span className="log-timestamp">{timestamp}</span>
152 |           <span className="log-message">{message}</span>
153 |         </div>
154 |       );
155 |     }
156 | 
157 |     return (
158 |       <div key={index} className="log-line">
159 |         {log}
160 |       </div>
161 |     );
162 |   };
163 | 
164 |   return (
165 |     <div className="w-full h-[350px] flex flex-col border border-[#ddd] rounded-md overflow-hidden my-4 bg-[#f8f9fa] font-mono">
166 |       <div className="flex justify-between p-2 bg-[#f0f2f5] border-b border-[#ddd]">
167 |         <div className="font-semibold text-[#333]">Workflow Execution Logs</div>
168 |         <div className="flex items-center gap-2.5">
169 |           <div className="flex items-center gap-2">
170 |             {status === "running" && (
171 |               <button
172 |                 className={`flex items-center gap-1 py-1 px-2 bg-[#fff2f0] border border-[#ffccc7] rounded text-xs cursor-pointer text-[#ff4d4f] transition-all hover:bg-[#fff1f0] hover:border-[#ffa39e] ${
173 |                   isCancelling ? "opacity-60 cursor-not-allowed" : ""
174 |                 }`}
175 |                 onClick={cancelWorkflow}
176 |                 disabled={isCancelling}
177 |                 title="Cancel workflow execution"
178 |               >
179 |                 <svg
180 |                   xmlns="http://www.w3.org/2000/svg"
181 |                   width="16"
182 |                   height="16"
183 |                   viewBox="0 0 24 24"
184 |                   fill="none"
185 |                   stroke="currentColor"
186 |                   strokeWidth="2"
187 |                   strokeLinecap="round"
188 |                   strokeLinejoin="round"
189 |                   className="w-3.5 h-3.5"
190 |                 >
191 |                   <circle cx="12" cy="12" r="10" />
192 |                   <line x1="15" y1="9" x2="9" y2="15" />
193 |                   <line x1="9" y1="9" x2="15" y2="15" />
194 |                 </svg>
195 |                 {isCancelling ? "Cancelling..." : "Cancel"}
196 |               </button>
197 |             )}
198 |             {logs.length > 0 && (
199 |               <button
200 |                 className="flex items-center gap-1 py-1 px-2 bg-[#f5f5f5] border border-[#ddd] rounded text-xs cursor-pointer text-[#333] transition-all hover:bg-[#e6e6e6] hover:border-[#ccc]"
201 |                 onClick={downloadLogs}
202 |                 title="Download logs as text file"
203 |               >
204 |                 <svg
205 |                   xmlns="http://www.w3.org/2000/svg"
206 |                   width="16"
207 |                   height="16"
208 |                   viewBox="0 0 24 24"
209 |                   fill="none"
210 |                   stroke="currentColor"
211 |                   strokeWidth="2"
212 |                   strokeLinecap="round"
213 |                   strokeLinejoin="round"
214 |                   className="w-3.5 h-3.5"
215 |                 >
216 |                   <path d="M21 15v4a2 2 0 0 1-2 2H5a2 2 0 0 1-2-2v-4" />
217 |                   <polyline points="7 10 12 15 17 10" />
218 |                   <line x1="12" y1="15" x2="12" y2="3" />
219 |                 </svg>
220 |                 Download
221 |               </button>
222 |             )}
223 |           </div>
224 |           <div
225 |             className={`py-0.5 px-2 rounded text-xs font-medium ${
226 |               status === "running"
227 |                 ? "bg-[#e6f7ff] text-[#1890ff] border border-[#91d5ff]"
228 |                 : status === "completed"
229 |                 ? "bg-[#f6ffed] text-[#52c41a] border border-[#b7eb8f]"
230 |                 : status === "cancelling"
231 |                 ? "bg-[#fff2f0] text-orange border border-[#ffccc7]"
232 |                 : status === "cancelled"
233 |                 ? "bg-[#fff2f0] text-[#ff4d4f] border border-[#ffccc7]"
234 |                 : status === "failed"
235 |                 ? "bg-[#fff2f0] text-[#ff4d4f] border border-[#ffccc7]"
236 |                 : "bg-[#fafafa] text-[#888] border border-[#ddd]"
237 |             }`}
238 |           >
239 |             Status: {status.charAt(0).toUpperCase() + status.slice(1)}
240 |           </div>
241 |         </div>
242 |       </div>
243 | 
244 |       <div
245 |         className="flex-1 overflow-y-auto p-3 text-xs leading-normal whitespace-pre-wrap break-words bg-white text-[#333]"
246 |         ref={logContainerRef}
247 |       >
248 |         {logs.length > 0 ? (
249 |           logs.map((log, index) => formatLog(log, index))
250 |         ) : (
251 |           <div className="text-[#999] italic py-5 text-center">
252 |             Waiting for logs...
253 |           </div>
254 |         )}
255 | 
256 |         {error && (
257 |           <div className="mt-2 p-2 rounded bg-[#fff2f0] text-[#ff4d4f] border border-[#ffccc7]">
258 |             <strong>Error:</strong> {error}
259 |           </div>
260 |         )}
261 |       </div>
262 | 
263 |       {/* Close button at the bottom */}
264 |       <div className="p-2.5 flex justify-center border-t border-[#ddd] bg-[#f0f2f5]">
265 |         <button
266 |           className="py-1.5 px-4 bg-[#f5f5f5] border border-[#ddd] rounded text-sm font-medium cursor-pointer text-[#333] transition-all hover:bg-[#e6e6e6] hover:border-[#ccc]"
267 |           onClick={onClose}
268 |           title="Close log viewer"
269 |         >
270 |           Close
271 |         </button>
272 |       </div>
273 |     </div>
274 |   );
275 | };
276 | 
277 | export default LogViewer;
278 | 


--------------------------------------------------------------------------------
/ui/src/components/no-workflow-message.tsx:
--------------------------------------------------------------------------------
 1 | import React from 'react';
 2 | 
 3 | const NoWorkflowsMessage: React.FC = () => {
 4 |   return (
 5 |     <div className="flex flex-col justify-center items-center h-screen bg-[#2a2a2a] text-white p-0 px-5 text-center">
 6 |       <img 
 7 |         src="/browseruse.png" 
 8 |         alt="Browser Use Logo" 
 9 |         className="w-[150px] h-auto mb-[30px]"
10 |       />
11 |       <h2 className="text-xl mb-[10px]">No Workflows Found</h2>
12 |       <p className="text-sm max-w-[500px] leading-normal mb-[10px]">
13 |         To get started with Workflow Use, you need to first create a workflow 
14 |         or place an existing workflow file in the <code>workflows/tmp</code> folder.
15 |       </p>
16 |       <p className="text-sm max-w-[450px] leading-normal mb-[30px]">
17 |         Once you've added a workflow file, refresh this page to visualize and interact with it. For more information, checkout out the documentation below.
18 |       </p>
19 |       <a 
20 |         href="https://github.com/browser-use/workflow-use" 
21 |         target="_blank" 
22 |         rel="noopener noreferrer"
23 |         className="inline-block bg-blue-400 hover:bg-blue-500 text-white no-underline py-[10px] px-[20px] rounded font-bold text-base transition-colors"
24 |       >
25 |         Learn More
26 |       </a>
27 |     </div>
28 |   );
29 | };
30 | 
31 | export default NoWorkflowsMessage;
32 | 


--------------------------------------------------------------------------------
/ui/src/components/play-button.tsx:
--------------------------------------------------------------------------------
  1 | import React, { useState } from "react";
  2 | import LogViewer from "./log-viewer";
  3 | import { PlayButtonProps, InputField } from "../types/play-button.types";
  4 | 
  5 | export const PlayButton: React.FC<PlayButtonProps> = ({
  6 |   workflowName,
  7 |   workflowMetadata,
  8 | }) => {
  9 |   const [showModal, setShowModal] = useState<boolean>(false);
 10 |   const [showLogViewer, setShowLogViewer] = useState<boolean>(false);
 11 |   const [isRunning, setIsRunning] = useState<boolean>(false);
 12 |   const [error, setError] = useState<string | null>(null);
 13 |   const [inputFields, setInputFields] = useState<InputField[]>([]);
 14 |   const [taskId, setTaskId] = useState<string | null>(null);
 15 |   const [logPosition, setLogPosition] = useState<number>(0);
 16 |   const [workflowStatus, setWorkflowStatus] = useState<string>("idle");
 17 | 
 18 |   const openModal = () => {
 19 |     if (!workflowName) return;
 20 | 
 21 |     setShowModal(true);
 22 |     setError(null);
 23 | 
 24 |     if (workflowMetadata && workflowMetadata.input_schema) {
 25 |       const fields = workflowMetadata.input_schema.map((input: any) => ({
 26 |         name: input.name,
 27 |         type: input.type,
 28 |         required: input.required,
 29 |         value: input.type === "boolean" ? false : "",
 30 |       }));
 31 |       setInputFields(fields);
 32 |     } else {
 33 |       setInputFields([]);
 34 |     }
 35 |   };
 36 | 
 37 |   const closeModal = () => {
 38 |     setShowModal(false);
 39 | 
 40 |     if (!isRunning) {
 41 |       resetState();
 42 |     }
 43 |   };
 44 | 
 45 |   const closeLogViewer = () => {
 46 |     setShowLogViewer(false);
 47 |     resetState();
 48 |   };
 49 | 
 50 |   const resetState = () => {
 51 |     setIsRunning(false);
 52 |     setError(null);
 53 |     setInputFields([]);
 54 |     setTaskId(null);
 55 |     setLogPosition(0);
 56 |     setWorkflowStatus("idle");
 57 |   };
 58 | 
 59 |   const handleInputChange = (index: number, value: any) => {
 60 |     const updatedFields = [...inputFields];
 61 |     if (updatedFields[index]) {
 62 |       updatedFields[index].value = value;
 63 |       setInputFields(updatedFields);
 64 |     }
 65 |   };
 66 | 
 67 |   const executeWorkflow = async () => {
 68 |     if (!workflowName) return;
 69 | 
 70 |     const missingInputs = inputFields.filter(
 71 |       (field) => field.required && !field.value
 72 |     );
 73 |     if (missingInputs.length > 0) {
 74 |       setError(
 75 |         `Missing required inputs: ${missingInputs
 76 |           .map((f) => f.name)
 77 |           .join(", ")}`
 78 |       );
 79 |       return;
 80 |     }
 81 | 
 82 |     setIsRunning(true);
 83 |     setError(null);
 84 |     setTaskId(null);
 85 |     setLogPosition(0);
 86 |     setWorkflowStatus("idle");
 87 | 
 88 |     try {
 89 |       const inputs: Record<string, any> = {};
 90 |       inputFields.forEach((field) => {
 91 |         inputs[field.name] = field.value;
 92 |       });
 93 | 
 94 |       const response = await fetch(
 95 |         "http://127.0.0.1:8000/api/workflows/execute",
 96 |         {
 97 |           method: "POST",
 98 |           headers: {
 99 |             "Content-Type": "application/json",
100 |           },
101 |           body: JSON.stringify({
102 |             name: workflowName,
103 |             inputs,
104 |           }),
105 |         }
106 |       );
107 | 
108 |       const data = await response.json();
109 |       setTaskId(data.task_id);
110 |       setLogPosition(data.log_position);
111 |       setIsRunning(true);
112 |       setShowLogViewer(true);
113 |       setShowModal(false);
114 |     } catch (err) {
115 |       console.error("Failed to execute workflow:", err);
116 |       setError("An error occurred while executing the workflow");
117 |     }
118 |   };
119 | 
120 |   const handleStatusChange = (status: string) => {
121 |     setWorkflowStatus(status);
122 | 
123 |     if (
124 |       status === "completed" ||
125 |       status === "failed" ||
126 |       status === "cancelled"
127 |     ) {
128 |       setIsRunning(false);
129 |     }
130 |   };
131 | 
132 |   const handleCancelWorkflow = () => {
133 |     setWorkflowStatus("cancelling");
134 |   };
135 | 
136 |   const handleWorkflowError = (errorMessage: string) => {
137 |     setError(errorMessage);
138 |   };
139 | 
140 |   if (!workflowName) return null;
141 | 
142 |   return (
143 |     <div>
144 |       {/* play button */}
145 |       <button
146 |         title="Execute workflow"
147 |         onClick={openModal}
148 |         className="z-10 flex h-9 w-9 items-center justify-center rounded-full bg-[#2a2a2a] text-white shadow transition-transform duration-200 ease-in-out hover:scale-105 hover:bg-blue-500"
149 |       >
150 |         ▶
151 |       </button>
152 | 
153 |       {/* parameter‑input modal */}
154 |       {showModal && (
155 |         <div className="fixed inset-0 z-[1000] flex items-center justify-center bg-black/50">
156 |           <div className="flex max-h-[80vh] w-[600px] max-w-[80vw] flex-col overflow-hidden rounded-lg bg-[#2a2a2a] text-white shadow-2xl">
157 |             {/* header */}
158 |             <div className="flex items-center justify-between border-b border-gray-700 p-4">
159 |               <h3 className="m-0 text-lg">
160 |                 Execute Workflow: {workflowMetadata?.name || workflowName}
161 |               </h3>
162 |               <button
163 |                 onClick={closeModal}
164 |                 className="text-2xl text-gray-400 hover:text-white"
165 |               >
166 |                 ×
167 |               </button>
168 |             </div>
169 | 
170 |             {/* content */}
171 |             <div className="flex-1 overflow-y-auto p-4">
172 |               {error && (
173 |                 <div className="mb-4 rounded bg-red-800/20 p-2 text-red-300">
174 |                   {error}
175 |                 </div>
176 |               )}
177 | 
178 |               {inputFields.length ? (
179 |                 <div className="mb-5">
180 |                   <h4 className="mb-3 mt-0 text-base text-gray-300">
181 |                     Input Parameters
182 |                   </h4>
183 | 
184 |                   {inputFields.map((f, i) => (
185 |                     <div key={f.name} className="mb-3">
186 |                       <label className="mb-1 block text-sm text-gray-300">
187 |                         {f.name}
188 |                         {f.required && (
189 |                           <span className="ml-1 text-red-400">*</span>
190 |                         )}
191 |                         <span className="ml-1 text-xs text-gray-500">
192 |                           ({f.type})
193 |                         </span>
194 |                       </label>
195 | 
196 |                       {f.type === "boolean" ? (
197 |                         <input
198 |                           type="checkbox"
199 |                           checked={f.value as boolean}
200 |                           onChange={(e) =>
201 |                             handleInputChange(i, e.target.checked)
202 |                           }
203 |                         />
204 |                       ) : (
205 |                         <input
206 |                           type={f.type === "number" ? "number" : "text"}
207 |                           value={f.value as string | number}
208 |                           onChange={(e) => handleInputChange(i, e.target.value)}
209 |                           className="w-full rounded border border-gray-600 bg-[#333] px-3 py-2 text-sm text-white"
210 |                         />
211 |                       )}
212 |                     </div>
213 |                   ))}
214 |                 </div>
215 |               ) : (
216 |                 <p>No input parameters required for this workflow.</p>
217 |               )}
218 | 
219 |               <div className="mt-5 flex justify-end gap-3">
220 |                 <button
221 |                   onClick={closeModal}
222 |                   className="rounded bg-gray-600 px-4 py-2 text-sm text-white hover:bg-gray-500"
223 |                 >
224 |                   Cancel
225 |                 </button>
226 |                 <button
227 |                   onClick={executeWorkflow}
228 |                   disabled={isRunning}
229 |                   className="rounded bg-blue-400 px-4 py-2 text-sm text-white hover:bg-blue-500 disabled:cursor-not-allowed disabled:bg-gray-600 disabled:opacity-70"
230 |                 >
231 |                   Execute Workflow
232 |                 </button>
233 |               </div>
234 |             </div>
235 |           </div>
236 |         </div>
237 |       )}
238 | 
239 |       {/* log viewer */}
240 |       {showLogViewer && taskId && (
241 |         <div className="fixed inset-0 z-[1000] flex items-center justify-center bg-black/50">
242 |           <div className="flex max-h-[80vh] w-[650px] max-w-[80vw] flex-col overflow-hidden rounded-lg bg-[#2a2a2a] text-white shadow-2xl">
243 |             <div className="flex items-center justify-between border-b border-gray-700 p-4">
244 |               <div>
245 |                 Workflow Execution
246 |                 {workflowStatus !== "running" &&
247 |                   ` (${workflowStatus
248 |                     .charAt(0)
249 |                     .toUpperCase()}${workflowStatus.slice(1)})`}
250 |               </div>
251 |             </div>
252 | 
253 |             <div className="flex-1 overflow-y-auto p-4">
254 |               <LogViewer
255 |                 taskId={taskId}
256 |                 initialPosition={logPosition}
257 |                 onStatusChange={handleStatusChange}
258 |                 onError={handleWorkflowError}
259 |                 onCancel={handleCancelWorkflow}
260 |                 onClose={closeLogViewer}
261 |               />
262 |             </div>
263 |           </div>
264 |         </div>
265 |       )}
266 |     </div>
267 |   );
268 | };
269 | 


--------------------------------------------------------------------------------
/ui/src/components/sidebar.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import WorkflowItem from "./workflow-item";
 3 | import { WorkflowMetadata } from "../types/workflow-layout.types";
 4 | 
 5 | interface SidebarProps {
 6 |   workflows: string[];
 7 |   onSelect: (workflow: string) => void;
 8 |   selected: string | null;
 9 |   workflowMetadata: WorkflowMetadata | null;
10 |   onUpdateMetadata: (metadata: WorkflowMetadata) => Promise<void>;
11 |   allWorkflowsMetadata?: Record<string, WorkflowMetadata>;
12 | }
13 | 
14 | export const Sidebar: React.FC<SidebarProps> = ({
15 |   workflows,
16 |   onSelect,
17 |   selected,
18 |   workflowMetadata,
19 |   onUpdateMetadata,
20 |   allWorkflowsMetadata = {},
21 | }) => (
22 |   <aside className="w-[250px] border-r border-[#542e2e] p-3 bg-[#2a2a2a] text-white flex flex-col overflow-auto">
23 |     {/* logo */}
24 |     <div className="flex justify-center mb-4">
25 |       <img
26 |         src="/browseruse.png"
27 |         alt="Browser Use Logo"
28 |         className="max-w-[80%] max-h-[60px]"
29 |       />
30 |     </div>
31 | 
32 |     <h3 className="text-lg text-[#ddd]">Workflows</h3>
33 | 
34 |     <ul className="m-0 p-0">
35 |       {workflows.map((id) => (
36 |         <WorkflowItem
37 |           key={id}
38 |           id={id}
39 |           selected={id === selected}
40 |           metadata={
41 |             id === selected
42 |               ? workflowMetadata ?? undefined
43 |               : allWorkflowsMetadata[id]
44 |           }
45 |           onSelect={onSelect}
46 |           onUpdateMetadata={onUpdateMetadata}
47 |         />
48 |       ))}
49 |     </ul>
50 |   </aside>
51 | );
52 | 
53 | export default Sidebar;
54 | 


--------------------------------------------------------------------------------
/ui/src/components/workflow-item.tsx:
--------------------------------------------------------------------------------
  1 | import React, { useState, ChangeEvent } from "react";
  2 | import {
  3 |   WorkflowMetadata,
  4 |   WorkflowItemProps,
  5 | } from "../types/workflow-layout.types";
  6 | 
  7 | const WorkflowItem: React.FC<WorkflowItemProps> = ({
  8 |   id,
  9 |   selected,
 10 |   metadata,
 11 |   onSelect,
 12 |   onUpdateMetadata,
 13 | }) => {
 14 |   const [isEditing, setIsEditing] = useState(false);
 15 |   const [edited, setEdited] = useState<WorkflowMetadata | null>(null);
 16 |   const [submitting, setSubmitting] = useState(false);
 17 | 
 18 |   const displayName = () => {
 19 |     if (metadata)
 20 |       return (
 21 |         <>
 22 |           <span className="text-md">{metadata.name}</span>
 23 |           {metadata.version && (
 24 |             <span className="text-xs text-[#888] ml-1.5">
 25 |               v{metadata.version}
 26 |             </span>
 27 |           )}
 28 |         </>
 29 |       );
 30 | 
 31 |     return (
 32 |       <span className="text-[#ccc]">
 33 |         <span className="opacity-70">Loading workflow…</span>
 34 |         <span className="hidden">{id}</span>
 35 |       </span>
 36 |     );
 37 |   };
 38 | 
 39 |   const change =
 40 |     (field: keyof WorkflowMetadata) =>
 41 |     (e: ChangeEvent<HTMLInputElement | HTMLTextAreaElement>) =>
 42 |       edited && setEdited({ ...edited, [field]: e.target.value });
 43 | 
 44 |   const save = async () => {
 45 |     if (!edited) return;
 46 |     setSubmitting(true);
 47 |     await onUpdateMetadata(edited).finally(() => setSubmitting(false));
 48 |     setIsEditing(false);
 49 |   };
 50 | 
 51 |   const editForm = metadata && (
 52 |     <div>
 53 |       {(["name", "version"] as (keyof WorkflowMetadata)[]).map((f) => (
 54 |         <label key={f} className="block text-xs mb-2">
 55 |           <span className="block text-[#aaa] mb-1">
 56 |             {f[0]?.toUpperCase() + f.slice(1)}
 57 |           </span>
 58 |           <input
 59 |             className="w-full bg-[#333] border border-[#555] text-white p-1.5 rounded text-xs"
 60 |             value={edited?.[f] ?? ""}
 61 |             onChange={change(f)}
 62 |           />
 63 |         </label>
 64 |       ))}
 65 | 
 66 |       <label className="block text-xs mb-2">
 67 |         <span className="block text-[#aaa] mb-1">Description</span>
 68 |         <textarea
 69 |           className="w-full bg-[#333] border border-[#555] text-white p-1.5 rounded min-h-[60px] resize-y text-xs"
 70 |           value={edited?.description ?? ""}
 71 |           onChange={change("description")}
 72 |         />
 73 |       </label>
 74 | 
 75 |       <div className="flex gap-2 justify-end">
 76 |         <button
 77 |           onClick={() => setIsEditing(false)}
 78 |           className="bg-[#444] text-white py-1.5 px-3 rounded text-xs"
 79 |         >
 80 |           Cancel
 81 |         </button>
 82 |         <button
 83 |           disabled={submitting}
 84 |           onClick={save}
 85 |           className={`bg-blue-400 hover:bg-blue-500 text-white py-1.5 px-3 rounded text-xs ${
 86 |             submitting && "opacity-70"
 87 |           }`}
 88 |         >
 89 |           {submitting ? "Saving…" : "Save"}
 90 |         </button>
 91 |       </div>
 92 |     </div>
 93 |   );
 94 | 
 95 |   const readOnly = metadata && (
 96 |     <>
 97 |       <div className="mb-2">
 98 |         <div className="text-xs text-[#aaa] mb-1">Description</div>
 99 |         <div className="text-xs">{metadata.description}</div>
100 |       </div>
101 | 
102 |       {metadata.input_schema?.length && (
103 |         <>
104 |           <div className="text-xs text-[#aaa] mb-1">Input Parameters</div>
105 |           <ul className="pl-4 text-xs list-disc marker:text-[#7ac5ff]">
106 |             {metadata.input_schema.map((p) => (
107 |               <li key={p.name} className="mb-1">
108 |                 <span className="text-[#7ac5ff]">{p.name}</span>
109 |                 <span className="text-[#aaa]"> ({p.type})</span>
110 |                 {p.required && <span className="text-[#ff7a7a]"> *</span>}
111 |               </li>
112 |             ))}
113 |           </ul>
114 |         </>
115 |       )}
116 |     </>
117 |   );
118 | 
119 |   return (
120 |     <>
121 |       {/* row button */}
122 |       <li>
123 |         <button
124 |           className={`w-full text-left py-1.5 ${
125 |             selected ? "font-semibold text-[#7ac5ff]" : "text-[#ccc]"
126 |           }`}
127 |           onClick={() => onSelect(id)}
128 |         >
129 |           {displayName()}
130 |         </button>
131 |       </li>
132 | 
133 |       {/* details panel */}
134 |       {selected && metadata && (
135 |         <li className="py-2 pl-4 border-l border-[#444] my-1 ml-1">
136 |           <div className="flex justify-between items-center mb-2">
137 |             <h4 className="m-0 text-sm text-[#ddd]">Details</h4>
138 |             {!isEditing && (
139 |               <button
140 |                 onClick={() => {
141 |                   setEdited({ ...metadata });
142 |                   setIsEditing(true);
143 |                 }}
144 |                 className="bg-[#444] text-white py-1 px-2 rounded text-xs"
145 |               >
146 |                 Edit
147 |               </button>
148 |             )}
149 |           </div>
150 |           {isEditing ? editForm : readOnly}
151 |         </li>
152 |       )}
153 |     </>
154 |   );
155 | };
156 | 
157 | export default WorkflowItem;
158 | 


--------------------------------------------------------------------------------
/ui/src/components/workflow-layout.tsx:
--------------------------------------------------------------------------------
  1 | import React, {
  2 |   useState,
  3 |   useCallback,
  4 |   useLayoutEffect,
  5 |   MouseEvent,
  6 |   useEffect,
  7 | } from "react";
  8 | import {
  9 |   ReactFlow,
 10 |   Background,
 11 |   Controls,
 12 |   MiniMap,
 13 |   addEdge,
 14 |   useNodesState,
 15 |   useEdgesState,
 16 |   type OnConnect,
 17 |   useReactFlow,
 18 | } from "@xyflow/react";
 19 | import { type Node } from "@xyflow/react";
 20 | import { NodeData } from "../types/node-config-menu.types";
 21 | import { jsonToFlow } from "../utils/json-to-flow";
 22 | import { type WorkflowMetadata } from "../types/workflow-layout.types";
 23 | import Sidebar from "./sidebar";
 24 | import { NodeConfigMenu } from "./node-config-menu";
 25 | import { PlayButton } from "./play-button";
 26 | import NoWorkflowsMessage from "./no-workflow-message";
 27 | import { $api } from "../lib/api";
 28 | 
 29 | const WorkflowLayout: React.FC = () => {
 30 |   const [selected, setSelected] = useState<string | null>(null);
 31 |   const [nodes, setNodes, onNodesChange] = useNodesState([]);
 32 |   const [edges, setEdges, onEdgesChange] = useEdgesState([]);
 33 |   const [selectedNode, setSelectedNode] = useState<Node<NodeData> | null>(null);
 34 |   const [workflowMetadata, setWorkflowMetadata] =
 35 |     useState<WorkflowMetadata | null>(null);
 36 |   const [savedNodePositions, setSavedNodePositions] = useState<
 37 |     Record<string, Record<string, { x: number; y: number }>>
 38 |   >({});
 39 |   const { fitView } = useReactFlow();
 40 | 
 41 |   // ----- Queries using $api -----
 42 |   // Fetch all workflows
 43 |   const { data: workflowsResponse, isLoading: isLoadingWorkflows } =
 44 |     $api.useQuery("get", "/api/workflows");
 45 | 
 46 |   const workflows: string[] = workflowsResponse?.workflows ?? [];
 47 | 
 48 |   // Fetch a specific workflow (enabled only when selected is truthy)
 49 |   const { data: selectedWorkflow, isLoading: isLoadingSelectedWorkflow } =
 50 |     $api.useQuery(
 51 |       "get",
 52 |       "/api/workflows/{name}",
 53 |       selected
 54 |         ? {
 55 |             params: { path: { name: selected } },
 56 |           }
 57 |         : ({} as any),
 58 |       {
 59 |         enabled: !!selected,
 60 |       }
 61 |     );
 62 | 
 63 |   // Mutation for updating workflow metadata
 64 |   const updateMetadataMutation = $api.useMutation(
 65 |     "post",
 66 |     "/api/workflows/update-metadata"
 67 |   );
 68 | 
 69 |   const updateWorkflowMetadata = useCallback(
 70 |     async (name: string, metadata: WorkflowMetadata) => {
 71 |       await updateMetadataMutation.mutateAsync({
 72 |         body: { name, metadata } as any,
 73 |       });
 74 |     },
 75 |     [updateMetadataMutation]
 76 |   );
 77 | 
 78 |   const isUpdating = updateMetadataMutation.isPending;
 79 | 
 80 |   const onConnect: OnConnect = useCallback(
 81 |     (connection) => setEdges((edges) => addEdge(connection, edges)),
 82 |     [setEdges]
 83 |   );
 84 | 
 85 |   // Handle node click to show configuration
 86 |   const onNodeClick = useCallback((_: MouseEvent, node: Node<NodeData>) => {
 87 |     setSelectedNode(node);
 88 |   }, []);
 89 | 
 90 |   // Close the node configuration menu
 91 |   const closeNodeMenu = useCallback(() => {
 92 |     setSelectedNode(null);
 93 |   }, []);
 94 | 
 95 |   // Fit view when nodes change
 96 |   useLayoutEffect(() => {
 97 |     if (nodes.length > 0) {
 98 |       window.requestAnimationFrame(() => {
 99 |         fitView({ padding: 0.2 });
100 |       });
101 |     }
102 |   }, [nodes.length, fitView]);
103 | 
104 |   // Update nodes and edges when selected workflow changes
105 |   useEffect(() => {
106 |     if (selectedWorkflow) {
107 |       const flowData = jsonToFlow(selectedWorkflow);
108 | 
109 |       // Apply saved positions if available
110 |       if (selected && savedNodePositions[selected]) {
111 |         const savedPositionsForWorkflow = savedNodePositions[selected] || {};
112 |         const nodesWithSavedPositions = flowData.nodes.map((node: any) => {
113 |           const savedPosition = savedPositionsForWorkflow[node.id];
114 |           if (savedPosition) {
115 |             return {
116 |               ...node,
117 |               position: savedPosition,
118 |             };
119 |           }
120 |           return node;
121 |         });
122 |         setNodes(nodesWithSavedPositions as any);
123 |       } else {
124 |         setNodes(flowData.nodes as any);
125 |       }
126 | 
127 |       setEdges(flowData.edges as any);
128 |       setWorkflowMetadata(flowData.metadata);
129 |     }
130 |   }, [selectedWorkflow, selected, savedNodePositions, setNodes, setEdges]);
131 | 
132 |   // Handle node drag stop to save positions
133 |   const onNodeDragStop = useCallback(
134 |     (_: React.MouseEvent, node: Node) => {
135 |       if (selected) {
136 |         setSavedNodePositions((prev) => {
137 |           const workflowPositions = prev[selected] || {};
138 |           return {
139 |             ...prev,
140 |             [selected]: {
141 |               ...workflowPositions,
142 |               [node.id]: { x: node.position.x, y: node.position.y },
143 |             },
144 |           };
145 |         });
146 |       }
147 |     },
148 |     [selected]
149 |   );
150 | 
151 |   // Auto-select first workflow if none selected
152 |   useEffect(() => {
153 |     if (workflows.length > 0 && !selected) {
154 |       setSelected(workflows[0]!);
155 |     }
156 |   }, [workflows, selected]);
157 | 
158 |   const isLoading = isLoadingWorkflows || isLoadingSelectedWorkflow;
159 | 
160 |   if (isLoading) {
161 |     return (
162 |       <div className="flex h-screen flex-col items-center justify-center bg-[#2a2a2a] text-white">
163 |         <img
164 |           src="/browseruse.png"
165 |           alt="Loading..."
166 |           className="mb-5 h-auto w-30 animate-spin"
167 |         />
168 |         <div className="text-lg">Loading workflows...</div>
169 |       </div>
170 |     );
171 |   }
172 | 
173 |   if (!workflows.length) return <NoWorkflowsMessage />;
174 | 
175 |   return (
176 |     <div className="flex h-screen font-sans">
177 |       <Sidebar
178 |         workflows={workflows}
179 |         onSelect={setSelected}
180 |         selected={selected}
181 |         workflowMetadata={workflowMetadata}
182 |         onUpdateMetadata={async (metadata: WorkflowMetadata) => {
183 |           if (selected) {
184 |             await updateWorkflowMetadata(selected, metadata);
185 |           }
186 |         }}
187 |       />
188 | 
189 |       <div className="relative flex-1">
190 |         {nodes.length ? (
191 |           <>
192 |             <ReactFlow
193 |               nodes={nodes}
194 |               edges={edges}
195 |               colorMode="dark"
196 |               onNodesChange={onNodesChange}
197 |               onEdgesChange={onEdgesChange}
198 |               onConnect={onConnect}
199 |               onNodeClick={onNodeClick}
200 |               onNodeDragStop={onNodeDragStop}
201 |               fitView
202 |             >
203 |               <Background />
204 |               <MiniMap />
205 |               <Controls />
206 |             </ReactFlow>
207 | 
208 |             {/* actions */}
209 |             <div className="absolute right-5 top-5 z-10 flex gap-2">
210 |               <PlayButton
211 |                 workflowName={selected}
212 |                 workflowMetadata={workflowMetadata}
213 |               />
214 | 
215 |               <button
216 |                 title="Refresh workflow"
217 |                 className="flex h-9 w-9 items-center justify-center rounded-full bg-[#2a2a2a] text-white shadow transition-transform duration-200 ease-in-out hover:scale-105 hover:bg-blue-500"
218 |                 onClick={async () => {
219 |                   if (selected && workflowMetadata) {
220 |                     await updateWorkflowMetadata(selected, workflowMetadata);
221 |                   }
222 |                 }}
223 |                 disabled={isUpdating}
224 |               >
225 |                 {/* hero‑icons refresh */}
226 |                 <svg
227 |                   xmlns="http://www.w3.org/2000/svg"
228 |                   viewBox="0 0 24 24"
229 |                   className="h-4 w-4"
230 |                   fill="none"
231 |                   stroke="currentColor"
232 |                   strokeWidth={2}
233 |                   strokeLinecap="round"
234 |                   strokeLinejoin="round"
235 |                 >
236 |                   <path d="M21.5 2v6h-6M2.5 22v-6h6M2 11.5a10 10 0 0 1 18.8-4.3M22 12.5a10 10 0 0 1-18.8 4.3" />
237 |                 </svg>
238 |               </button>
239 |             </div>
240 |           </>
241 |         ) : (
242 |           <div className="m-8 text-gray-500">
243 |             Select a workflow to visualize
244 |           </div>
245 |         )}
246 | 
247 |         {selectedNode && (
248 |           <NodeConfigMenu
249 |             node={selectedNode}
250 |             onClose={closeNodeMenu}
251 |             workflowFilename={selected}
252 |           />
253 |         )}
254 |       </div>
255 |     </div>
256 |   );
257 | };
258 | 
259 | export default WorkflowLayout;
260 | 


--------------------------------------------------------------------------------
/ui/src/index.css:
--------------------------------------------------------------------------------
 1 | @import "tailwindcss";
 2 | 
 3 | :root {
 4 |   font-family: Inter, system-ui, Avenir, Helvetica, Arial, sans-serif;
 5 |   line-height: 1.5;
 6 |   font-weight: 400;
 7 | }
 8 | 
 9 | html,
10 | body,
11 | #root {
12 |   height: 100%;
13 |   margin: 0;
14 | }
15 | 


--------------------------------------------------------------------------------
/ui/src/lib/api/index.ts:
--------------------------------------------------------------------------------
 1 | import createFetchClient from "openapi-fetch";
 2 | import createClient from "openapi-react-query";
 3 | import type { paths } from "./apigen"; // generated by openapi-typescript
 4 | 
 5 | export const fetchClient = createFetchClient<paths>({
 6 |   baseUrl: "http://localhost:8000",
 7 | });
 8 | 
 9 | export const $api = createClient(fetchClient);
10 | 
11 | export default $api;
12 | 


--------------------------------------------------------------------------------
/ui/src/lib/api/openapi.json:
--------------------------------------------------------------------------------
1 | {"openapi":"3.1.0","info":{"title":"Workflow Execution Service","version":"0.1.0"},"paths":{"/api/workflows":{"get":{"summary":"List Workflows","operationId":"list_workflows_api_workflows_get","responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{"$ref":"#/components/schemas/WorkflowListResponse"}}}}}}},"/api/workflows/{name}":{"get":{"summary":"Get Workflow","operationId":"get_workflow_api_workflows__name__get","parameters":[{"name":"name","in":"path","required":true,"schema":{"type":"string","title":"Name"}}],"responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{"type":"string","title":"Response Get Workflow Api Workflows  Name  Get"}}}},"422":{"description":"Validation Error","content":{"application/json":{"schema":{"$ref":"#/components/schemas/HTTPValidationError"}}}}}}},"/api/workflows/update":{"post":{"summary":"Update Workflow","operationId":"update_workflow_api_workflows_update_post","requestBody":{"content":{"application/json":{"schema":{"$ref":"#/components/schemas/WorkflowUpdateRequest"}}},"required":true},"responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{"$ref":"#/components/schemas/WorkflowResponse"}}}},"422":{"description":"Validation Error","content":{"application/json":{"schema":{"$ref":"#/components/schemas/HTTPValidationError"}}}}}}},"/api/workflows/update-metadata":{"post":{"summary":"Update Workflow Metadata","operationId":"update_workflow_metadata_api_workflows_update_metadata_post","requestBody":{"content":{"application/json":{"schema":{"$ref":"#/components/schemas/WorkflowMetadataUpdateRequest"}}},"required":true},"responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{"$ref":"#/components/schemas/WorkflowResponse"}}}},"422":{"description":"Validation Error","content":{"application/json":{"schema":{"$ref":"#/components/schemas/HTTPValidationError"}}}}}}},"/api/workflows/execute":{"post":{"summary":"Execute Workflow","operationId":"execute_workflow_api_workflows_execute_post","requestBody":{"content":{"application/json":{"schema":{"$ref":"#/components/schemas/WorkflowExecuteRequest"}}},"required":true},"responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{"$ref":"#/components/schemas/WorkflowExecuteResponse"}}}},"422":{"description":"Validation Error","content":{"application/json":{"schema":{"$ref":"#/components/schemas/HTTPValidationError"}}}}}}},"/api/workflows/logs/{task_id}":{"get":{"summary":"Get Logs","operationId":"get_logs_api_workflows_logs__task_id__get","parameters":[{"name":"task_id","in":"path","required":true,"schema":{"type":"string","title":"Task Id"}},{"name":"position","in":"query","required":false,"schema":{"type":"integer","default":0,"title":"Position"}}],"responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{"$ref":"#/components/schemas/WorkflowLogsResponse"}}}},"422":{"description":"Validation Error","content":{"application/json":{"schema":{"$ref":"#/components/schemas/HTTPValidationError"}}}}}}},"/api/workflows/tasks/{task_id}/status":{"get":{"summary":"Get Task Status","operationId":"get_task_status_api_workflows_tasks__task_id__status_get","parameters":[{"name":"task_id","in":"path","required":true,"schema":{"type":"string","title":"Task Id"}}],"responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{"$ref":"#/components/schemas/WorkflowStatusResponse"}}}},"422":{"description":"Validation Error","content":{"application/json":{"schema":{"$ref":"#/components/schemas/HTTPValidationError"}}}}}}},"/api/workflows/tasks/{task_id}/cancel":{"post":{"summary":"Cancel Workflow","operationId":"cancel_workflow_api_workflows_tasks__task_id__cancel_post","parameters":[{"name":"task_id","in":"path","required":true,"schema":{"type":"string","title":"Task Id"}}],"responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{"$ref":"#/components/schemas/WorkflowCancelResponse"}}}},"422":{"description":"Validation Error","content":{"application/json":{"schema":{"$ref":"#/components/schemas/HTTPValidationError"}}}}}}}},"components":{"schemas":{"HTTPValidationError":{"properties":{"detail":{"items":{"$ref":"#/components/schemas/ValidationError"},"type":"array","title":"Detail"}},"type":"object","title":"HTTPValidationError"},"ValidationError":{"properties":{"loc":{"items":{"anyOf":[{"type":"string"},{"type":"integer"}]},"type":"array","title":"Location"},"msg":{"type":"string","title":"Message"},"type":{"type":"string","title":"Error Type"}},"type":"object","required":["loc","msg","type"],"title":"ValidationError"},"WorkflowCancelResponse":{"properties":{"success":{"type":"boolean","title":"Success"},"message":{"type":"string","title":"Message"}},"type":"object","required":["success","message"],"title":"WorkflowCancelResponse"},"WorkflowExecuteRequest":{"properties":{"name":{"type":"string","title":"Name"},"inputs":{"type":"object","title":"Inputs"}},"type":"object","required":["name","inputs"],"title":"WorkflowExecuteRequest"},"WorkflowExecuteResponse":{"properties":{"success":{"type":"boolean","title":"Success"},"task_id":{"type":"string","title":"Task Id"},"workflow":{"type":"string","title":"Workflow"},"log_position":{"type":"integer","title":"Log Position"},"message":{"type":"string","title":"Message"}},"type":"object","required":["success","task_id","workflow","log_position","message"],"title":"WorkflowExecuteResponse"},"WorkflowListResponse":{"properties":{"workflows":{"items":{"type":"string"},"type":"array","title":"Workflows"}},"type":"object","required":["workflows"],"title":"WorkflowListResponse"},"WorkflowLogsResponse":{"properties":{"logs":{"items":{"type":"string"},"type":"array","title":"Logs"},"position":{"type":"integer","title":"Position"},"log_position":{"type":"integer","title":"Log Position"},"status":{"type":"string","title":"Status"},"result":{"anyOf":[{"items":{"type":"object"},"type":"array"},{"type":"null"}],"title":"Result"},"error":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Error"}},"type":"object","required":["logs","position","log_position","status"],"title":"WorkflowLogsResponse"},"WorkflowMetadataUpdateRequest":{"properties":{"name":{"type":"string","title":"Name"},"metadata":{"type":"object","title":"Metadata"}},"type":"object","required":["name","metadata"],"title":"WorkflowMetadataUpdateRequest"},"WorkflowResponse":{"properties":{"success":{"type":"boolean","title":"Success"},"error":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Error"}},"type":"object","required":["success"],"title":"WorkflowResponse"},"WorkflowStatusResponse":{"properties":{"task_id":{"type":"string","title":"Task Id"},"status":{"type":"string","title":"Status"},"workflow":{"type":"string","title":"Workflow"},"result":{"anyOf":[{"items":{"type":"object"},"type":"array"},{"type":"null"}],"title":"Result"},"error":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Error"}},"type":"object","required":["task_id","status","workflow"],"title":"WorkflowStatusResponse"},"WorkflowUpdateRequest":{"properties":{"filename":{"type":"string","title":"Filename"},"nodeId":{"type":"integer","title":"Nodeid"},"stepData":{"type":"object","title":"Stepdata"}},"type":"object","required":["filename","nodeId","stepData"],"title":"WorkflowUpdateRequest"}}}}


--------------------------------------------------------------------------------
/ui/src/main.tsx:
--------------------------------------------------------------------------------
 1 | import React from 'react';
 2 | import ReactDOM from 'react-dom/client';
 3 | 
 4 | import App from './App';
 5 | 
 6 | import './index.css';
 7 | 
 8 | ReactDOM.createRoot(document.getElementById('root')!).render(
 9 |   <React.StrictMode>
10 |     <App />
11 |   </React.StrictMode>
12 | );
13 | 


--------------------------------------------------------------------------------
/ui/src/types/log-viewer.types.ts:
--------------------------------------------------------------------------------
1 | export interface LogViewerProps {
2 |   taskId: string | null;
3 |   initialPosition: number;
4 |   onStatusChange?: (status: string) => void;
5 |   onError?: (error: string) => void;
6 |   onCancel?: () => void;
7 |   onClose?: () => void;
8 | }


--------------------------------------------------------------------------------
/ui/src/types/node-config-menu.types.ts:
--------------------------------------------------------------------------------
 1 | import type { Node } from '@xyflow/react';
 2 | 
 3 | export interface StepData {
 4 |   description: string;
 5 |   output: any | null;
 6 |   timestamp: number | null;
 7 |   tabId: number | null;
 8 |   type: 'navigation' | 'click' | 'select_change' | 'input';
 9 |   url?: string;
10 |   cssSelector?: string;
11 |   xpath?: string;
12 |   elementTag?: string;
13 |   elementText?: string;
14 |   selectedText?: string;
15 |   value?: string;
16 | }
17 | 
18 | export interface NodeData extends Record<string, unknown> {
19 |   label: string;
20 |   stepData: StepData;
21 | }
22 | 
23 | export interface NodeConfigMenuProps {
24 |     node: Node<NodeData> | null;
25 |     onClose: () => void;
26 |     workflowFilename: string | null;
27 | }


--------------------------------------------------------------------------------
/ui/src/types/play-button.types.ts:
--------------------------------------------------------------------------------
 1 | import { WorkflowMetadata } from './workflow-layout.types';
 2 | 
 3 | export interface PlayButtonProps {
 4 |   workflowName: string | null;
 5 |   workflowMetadata: WorkflowMetadata | null;
 6 | }
 7 | 
 8 | export interface InputField {
 9 |   name: string;
10 |   type: string;
11 |   required: boolean;
12 |   value: any;
13 | }


--------------------------------------------------------------------------------
/ui/src/types/sidebar.types.ts:
--------------------------------------------------------------------------------
 1 | import { type WorkflowMetadata } from './workflow-layout.types';
 2 | 
 3 | export interface SidebarProps {
 4 |   workflows: string[];
 5 |   onSelect: (wf: string) => void;
 6 |   selected: string | null;
 7 |   workflowMetadata: WorkflowMetadata | null;
 8 |   onUpdateMetadata: (metadata: WorkflowMetadata) => Promise<void>;
 9 |   allWorkflowsMetadata?: Record<string, WorkflowMetadata>;
10 | }


--------------------------------------------------------------------------------
/ui/src/types/workflow-layout.types.ts:
--------------------------------------------------------------------------------
 1 | import { z } from 'zod';
 2 | import type { Node, BuiltInNode } from '@xyflow/react';
 3 | 
 4 | export type PositionLoggerNode = Node<{ label: string }, 'position-logger'>;
 5 | export type AppNode = BuiltInNode | PositionLoggerNode;
 6 | 
 7 | /* ── Input field definition ────────────────────────────────────────── */
 8 | const inputFieldSchema = z.object({
 9 |   name: z.string(),
10 |   type: z.enum(['string', 'number', 'boolean']),
11 |   required: z.boolean(),
12 | });
13 | 
14 | /* ── Step definition ───────────────────────────────────────────────── */
15 | const stepSchema = z.object({
16 |   /* core fields */
17 |   description: z.string(),
18 |   output: z.unknown().nullable(),
19 |   timestamp: z.number().int().nullable(),
20 |   tabId: z.number().int().nullable(),
21 |   type: z.enum(['navigation', 'click', 'select_change', 'input']),
22 | 
23 |   /* optional fields (vary by step type) */
24 |   url: z.string().url().optional(),
25 |   cssSelector: z.string().optional(),
26 |   xpath: z.string().optional(),
27 |   elementTag: z.string().optional(),
28 |   elementText: z.string().optional(),
29 |   selectedText: z.string().optional(),
30 |   value: z.string().optional(),
31 | });
32 | 
33 | /* ── Workflow wrapper ──────────────────────────────────────────────── */
34 | export const workflowSchema = z.object({
35 |   workflow_analysis: z.string(),
36 |   name: z.string(),
37 |   description: z.string(),
38 |   version: z.string(),
39 |   steps: z.array(stepSchema),
40 |   input_schema: z.array(inputFieldSchema),
41 | });
42 | 
43 | /* ── Inferred TypeScript type ───────────────────────────────────────– */
44 | export type Workflow = z.infer<typeof workflowSchema>;
45 | 
46 | export interface WorkflowStep {
47 |   description: string;
48 |   type: string;
49 |   [key: string]: any;
50 | }
51 | 
52 | export interface WorkflowMetadata {
53 |   name: string;
54 |   description: string;
55 |   version: string;
56 |   input_schema: any[];
57 |   workflow_analysis?: string;
58 | }
59 | 
60 | export interface WorkflowItemProps {
61 |   id: string;
62 |   selected: boolean;
63 |   metadata?: WorkflowMetadata;
64 |   onSelect: (id: string) => void;
65 |   onUpdateMetadata: (m: WorkflowMetadata) => Promise<void>;
66 | }
67 | 


--------------------------------------------------------------------------------
/ui/src/utils/json-to-flow.ts:
--------------------------------------------------------------------------------
 1 | import { Edge } from '@xyflow/react';
 2 | import { Workflow, WorkflowStep, WorkflowMetadata, AppNode } from '../types/workflow-layout.types';
 3 | 
 4 | export function jsonToFlow(workflow: string): { 
 5 |   nodes: AppNode[]; 
 6 |   edges: Edge[];
 7 |   metadata: WorkflowMetadata;
 8 | } {
 9 |   const parsedWorkflow = JSON.parse(workflow) as Workflow;
10 |   const nodes: AppNode[] = parsedWorkflow.steps.map((step: WorkflowStep, idx: number) => ({
11 |     id: String(idx),
12 |     data: { 
13 |       label: `${step.description}`, 
14 |       stepData: step,
15 |       workflowName: parsedWorkflow.name
16 |     },
17 |     position: { x: 0, y: idx * 100 }
18 |   }));
19 | 
20 |   const edges: Edge[] = parsedWorkflow.steps.slice(1).map((_, idx) => ({
21 |     id: `e${idx}-${idx + 1}`,
22 |     source: String(idx),
23 |     target: String(idx + 1),
24 |     animated: true,
25 |   }));
26 | 
27 |   const metadata: WorkflowMetadata = {
28 |     name: parsedWorkflow.name,
29 |     description: parsedWorkflow.description,
30 |     version: parsedWorkflow.version,
31 |     input_schema: parsedWorkflow.input_schema,
32 |     workflow_analysis: parsedWorkflow.workflow_analysis
33 |   };
34 | 
35 |   return { nodes, edges, metadata };
36 | }


--------------------------------------------------------------------------------
/ui/src/vite-env.d.ts:
--------------------------------------------------------------------------------
1 | /// <reference types="vite/client" />
2 | 


--------------------------------------------------------------------------------
/ui/tsconfig.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "compilerOptions": {
 3 |     "target": "ES2020",
 4 |     "useDefineForClassFields": true,
 5 |     "lib": [
 6 |       "ES2020",
 7 |       "DOM",
 8 |       "DOM.Iterable"
 9 |     ],
10 |     "module": "ESNext",
11 |     "skipLibCheck": true,
12 |     /* Bundler mode */
13 |     "moduleResolution": "bundler",
14 |     "allowImportingTsExtensions": true,
15 |     "resolveJsonModule": true,
16 |     "isolatedModules": true,
17 |     "noEmit": true,
18 |     "jsx": "react-jsx",
19 |     "noUncheckedIndexedAccess": true,
20 |     /* Linting */
21 |     "strict": true,
22 |     "noUnusedLocals": true,
23 |     "noUnusedParameters": true,
24 |     "noFallthroughCasesInSwitch": true
25 |   },
26 |   "include": [
27 |     "src"
28 |   ],
29 |   "references": [
30 |     {
31 |       "path": "./tsconfig.node.json"
32 |     }
33 |   ]
34 | }


--------------------------------------------------------------------------------
/ui/tsconfig.node.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "compilerOptions": {
 3 |     "composite": true,
 4 |     "skipLibCheck": true,
 5 |     "module": "ESNext",
 6 |     "moduleResolution": "bundler",
 7 |     "allowSyntheticDefaultImports": true
 8 |   },
 9 |   "include": ["vite.config.ts"]
10 | }
11 | 


--------------------------------------------------------------------------------
/ui/vite.config.ts:
--------------------------------------------------------------------------------
1 | import { defineConfig } from 'vite'
2 | import react from '@vitejs/plugin-react'
3 | import tailwindcss from '@tailwindcss/vite'
4 | 
5 | // https://vitejs.dev/config/
6 | export default defineConfig({
7 |   plugins: [react(), tailwindcss()],
8 | })
9 | 


--------------------------------------------------------------------------------
/workflows/.env.example:
--------------------------------------------------------------------------------
1 | # We support all langchain models, openai only for demo purposes
2 | OPENAI_API_KEY=


--------------------------------------------------------------------------------
/workflows/.gitignore:
--------------------------------------------------------------------------------
  1 | # Byte-compiled / optimized / DLL files
  2 | __pycache__/
  3 | *.py[cod]
  4 | *$py.class
  5 | 
  6 | # C extensions
  7 | *.so
  8 | 
  9 | # Distribution / packaging
 10 | .Python
 11 | build/
 12 | develop-eggs/
 13 | dist/
 14 | downloads/
 15 | eggs/
 16 | .eggs/
 17 | lib/
 18 | lib64/
 19 | parts/
 20 | sdist/
 21 | var/
 22 | wheels/
 23 | share/python-wheels/
 24 | *.egg-info/
 25 | .installed.cfg
 26 | *.egg
 27 | MANIFEST
 28 | 
 29 | # PyInstaller
 30 | #  Usually these files are written by a python script from a template
 31 | #  before PyInstaller builds the exe, so as to inject date/other infos into it.
 32 | *.manifest
 33 | *.spec
 34 | 
 35 | # Installer logs
 36 | pip-log.txt
 37 | pip-delete-this-directory.txt
 38 | 
 39 | # Unit test / coverage reports
 40 | htmlcov/
 41 | .tox/
 42 | .nox/
 43 | .coverage
 44 | .coverage.*
 45 | .cache
 46 | nosetests.xml
 47 | coverage.xml
 48 | *.cover
 49 | *.py,cover
 50 | .hypothesis/
 51 | .pytest_cache/
 52 | cover/
 53 | 
 54 | # Translations
 55 | *.mo
 56 | *.pot
 57 | 
 58 | # Django stuff:
 59 | *.log
 60 | local_settings.py
 61 | db.sqlite3
 62 | db.sqlite3-journal
 63 | 
 64 | # Flask stuff:
 65 | instance/
 66 | .webassets-cache
 67 | 
 68 | # Scrapy stuff:
 69 | .scrapy
 70 | 
 71 | # Sphinx documentation
 72 | docs/_build/
 73 | 
 74 | # PyBuilder
 75 | .pybuilder/
 76 | target/
 77 | 
 78 | # Jupyter Notebook
 79 | .ipynb_checkpoints
 80 | 
 81 | # IPython
 82 | profile_default/
 83 | ipython_config.py
 84 | 
 85 | # pyenv
 86 | #   For a library or package, you might want to ignore these files since the code is
 87 | #   intended to run in multiple environments; otherwise, check them in:
 88 | # .python-version
 89 | 
 90 | # pipenv
 91 | #   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
 92 | #   However, in case of collaboration, if having platform-specific dependencies or dependencies
 93 | #   having no cross-platform support, pipenv may install dependencies that don't work, or not
 94 | #   install all needed dependencies.
 95 | #Pipfile.lock
 96 | 
 97 | # poetry
 98 | #   Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
 99 | #   This is especially recommended for binary packages to ensure reproducibility, and is more
100 | #   commonly ignored for libraries.
101 | #   https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
102 | #poetry.lock
103 | 
104 | # pdm
105 | #   Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
106 | #pdm.lock
107 | #   pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
108 | #   in version control.
109 | #   https://pdm.fming.dev/latest/usage/project/#working-with-version-control
110 | .pdm.toml
111 | .pdm-python
112 | .pdm-build/
113 | 
114 | # PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
115 | __pypackages__/
116 | 
117 | # Celery stuff
118 | celerybeat-schedule
119 | celerybeat.pid
120 | 
121 | # SageMath parsed files
122 | *.sage.py
123 | 
124 | # Environments
125 | .env
126 | .venv
127 | env/
128 | venv/
129 | ENV/
130 | env.bak/
131 | venv.bak/
132 | test_env/
133 | myenv
134 | 
135 | 
136 | # Spyder project settings
137 | .spyderproject
138 | .spyproject
139 | 
140 | # Rope project settings
141 | .ropeproject
142 | 
143 | # mkdocs documentation
144 | /site
145 | 
146 | # mypy
147 | .mypy_cache/
148 | .dmypy.json
149 | dmypy.json
150 | 
151 | # Pyre type checker
152 | .pyre/
153 | 
154 | # pytype static type analyzer
155 | .pytype/
156 | 
157 | # Cython debug symbols
158 | cython_debug/
159 | 
160 | # PyCharm
161 | #  JetBrains specific template is maintained in a separate JetBrains.gitignore that can
162 | #  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
163 | #  and can be added to the global gitignore or merged into this file.  For a more nuclear
164 | #  option (not recommended) you can uncomment the following to ignore the entire idea folder.
165 | .idea/
166 | temp
167 | tmp
168 | 
169 | 
170 | .DS_Store
171 | 
172 | private_example.py
173 | private_example
174 | 
175 | browser_cookies.json
176 | cookies.json
177 | AgentHistory.json
178 | cv_04_24.pdf
179 | AgentHistoryList.json
180 | *.gif
181 | 
182 | # For Sharing (.pem files)
183 | .gradio/
184 | 
185 | # For Docker
186 | data/
187 | 
188 | # For Config Files (Current Settings)
189 | .config.pkl
190 | *.pdf
191 | 
192 | user_data_dir


--------------------------------------------------------------------------------
/workflows/.python-version:
--------------------------------------------------------------------------------
1 | 3.12


--------------------------------------------------------------------------------
/workflows/.vscode/launch.json:
--------------------------------------------------------------------------------
 1 | {
 2 |     "version": "0.2.0",
 3 |     "configurations": [
 4 |         {
 5 |             "name": "Python Debugger: Current File",
 6 |             "type": "debugpy",
 7 |             "request": "launch",
 8 |             "program": "${file}",
 9 |             "justMyCode": false,
10 |             "env": {
11 |                 "PYTHONPATH": "${workspaceFolder}"
12 |             },
13 |             "console": "integratedTerminal"
14 |         },
15 |     ]
16 | }


--------------------------------------------------------------------------------
/workflows/.vscode/settings.json:
--------------------------------------------------------------------------------
 1 | {
 2 |     "python.analysis.typeCheckingMode": "basic",
 3 |     "[python]": {
 4 |         "editor.defaultFormatter": "charliermarsh.ruff",
 5 |         "editor.formatOnSave": true,
 6 |         "editor.codeActionsOnSave": {
 7 |             "source.fixAll.ruff": "explicit",
 8 |             "source.organizeImports.ruff": "explicit"
 9 |         }
10 |     }
11 | }


--------------------------------------------------------------------------------
/workflows/README.md:
--------------------------------------------------------------------------------
1 | # Workflow Use python package
2 | 
3 | This is the python package for Workflow Use. It is used to create and execute workflows.
4 | 
5 | Currently only used to reserve the pypi package name.
6 | 


--------------------------------------------------------------------------------
/workflows/backend/api.py:
--------------------------------------------------------------------------------
 1 | import uvicorn
 2 | from fastapi import FastAPI
 3 | from fastapi.middleware.cors import CORSMiddleware
 4 | 
 5 | from .routers import router
 6 | 
 7 | app = FastAPI(title='Workflow Execution Service')
 8 | 
 9 | # Add CORS middleware
10 | app.add_middleware(
11 | 	CORSMiddleware,
12 | 	allow_origins=['http://localhost:5173'],
13 | 	allow_credentials=True,
14 | 	allow_methods=['*'],
15 | 	allow_headers=['*'],
16 | )
17 | 
18 | # Include routers
19 | app.include_router(router)
20 | 
21 | 
22 | # Optional standalone runner
23 | if __name__ == '__main__':
24 | 	uvicorn.run('api:app', host='127.0.0.1', port=8000, log_level='info')
25 | 


--------------------------------------------------------------------------------
/workflows/backend/routers.py:
--------------------------------------------------------------------------------
  1 | import asyncio
  2 | import uuid
  3 | 
  4 | from fastapi import APIRouter, HTTPException
  5 | 
  6 | from .service import WorkflowService
  7 | from .views import (
  8 | 	WorkflowCancelResponse,
  9 | 	WorkflowExecuteRequest,
 10 | 	WorkflowExecuteResponse,
 11 | 	WorkflowListResponse,
 12 | 	WorkflowLogsResponse,
 13 | 	WorkflowMetadataUpdateRequest,
 14 | 	WorkflowResponse,
 15 | 	WorkflowStatusResponse,
 16 | 	WorkflowUpdateRequest,
 17 | )
 18 | 
 19 | router = APIRouter(prefix='/api/workflows')
 20 | 
 21 | 
 22 | def get_service() -> WorkflowService:
 23 | 	return WorkflowService()
 24 | 
 25 | 
 26 | @router.get('', response_model=WorkflowListResponse)
 27 | async def list_workflows():
 28 | 	service = get_service()
 29 | 	workflows = service.list_workflows()
 30 | 	return WorkflowListResponse(workflows=workflows)
 31 | 
 32 | 
 33 | @router.get('/{name}', response_model=str)
 34 | async def get_workflow(name: str):
 35 | 	service = get_service()
 36 | 	return service.get_workflow(name)
 37 | 
 38 | 
 39 | @router.post('/update', response_model=WorkflowResponse)
 40 | async def update_workflow(request: WorkflowUpdateRequest):
 41 | 	service = get_service()
 42 | 	return service.update_workflow(request)
 43 | 
 44 | 
 45 | @router.post('/update-metadata', response_model=WorkflowResponse)
 46 | async def update_workflow_metadata(request: WorkflowMetadataUpdateRequest):
 47 | 	service = get_service()
 48 | 	return service.update_workflow_metadata(request)
 49 | 
 50 | 
 51 | @router.post('/execute', response_model=WorkflowExecuteResponse)
 52 | async def execute_workflow(request: WorkflowExecuteRequest):
 53 | 	service = get_service()
 54 | 	workflow_name = request.name
 55 | 	inputs = request.inputs
 56 | 
 57 | 	if not workflow_name:
 58 | 		raise HTTPException(status_code=400, detail='Missing workflow name')
 59 | 
 60 | 	workflow_path = service.tmp_dir / workflow_name
 61 | 	if not workflow_path.exists():
 62 | 		raise HTTPException(status_code=404, detail=f'Workflow {workflow_name} not found')
 63 | 
 64 | 	try:
 65 | 		task_id = str(uuid.uuid4())
 66 | 		cancel_event = asyncio.Event()
 67 | 		service.cancel_events[task_id] = cancel_event
 68 | 		log_pos = await service._log_file_position()
 69 | 
 70 | 		task = asyncio.create_task(service.run_workflow_in_background(task_id, request, cancel_event))
 71 | 		service.workflow_tasks[task_id] = task
 72 | 		task.add_done_callback(
 73 | 			lambda _: (
 74 | 				service.workflow_tasks.pop(task_id, None),
 75 | 				service.cancel_events.pop(task_id, None),
 76 | 			)
 77 | 		)
 78 | 		return WorkflowExecuteResponse(
 79 | 			success=True,
 80 | 			task_id=task_id,
 81 | 			workflow=workflow_name,
 82 | 			log_position=log_pos,
 83 | 			message=f"Workflow '{workflow_name}' execution started with task ID: {task_id}",
 84 | 		)
 85 | 	except Exception as exc:
 86 | 		raise HTTPException(status_code=500, detail=f'Error starting workflow: {exc}')
 87 | 
 88 | 
 89 | @router.get('/logs/{task_id}', response_model=WorkflowLogsResponse)
 90 | async def get_logs(task_id: str, position: int = 0):
 91 | 	service = get_service()
 92 | 	task_info = service.active_tasks.get(task_id)
 93 | 	logs, new_pos = await service._read_logs_from_position(position)
 94 | 	return WorkflowLogsResponse(
 95 | 		logs=logs,
 96 | 		position=new_pos,
 97 | 		log_position=new_pos,
 98 | 		status=task_info.status if task_info else 'unknown',
 99 | 		result=task_info.result if task_info else None,
100 | 		error=task_info.error if task_info else None,
101 | 	)
102 | 
103 | 
104 | @router.get('/tasks/{task_id}/status', response_model=WorkflowStatusResponse)
105 | async def get_task_status(task_id: str):
106 | 	service = get_service()
107 | 	task_info = service.get_task_status(task_id)
108 | 	if not task_info:
109 | 		raise HTTPException(status_code=404, detail=f'Task {task_id} not found')
110 | 	return task_info
111 | 
112 | 
113 | @router.post('/tasks/{task_id}/cancel', response_model=WorkflowCancelResponse)
114 | async def cancel_workflow(task_id: str):
115 | 	service = get_service()
116 | 	result = await service.cancel_workflow(task_id)
117 | 	if not result.success and result.message == 'Task not found':
118 | 		raise HTTPException(status_code=404, detail=f'Task {task_id} not found')
119 | 	return result
120 | 


--------------------------------------------------------------------------------
/workflows/backend/service.py:
--------------------------------------------------------------------------------
  1 | import asyncio
  2 | import json
  3 | import time
  4 | from pathlib import Path
  5 | from typing import Dict, List, Optional, Tuple
  6 | 
  7 | import aiofiles
  8 | from browser_use.browser.browser import Browser
  9 | from langchain_openai import ChatOpenAI
 10 | 
 11 | from workflow_use.controller.service import WorkflowController
 12 | from workflow_use.workflow.service import Workflow
 13 | 
 14 | from .views import (
 15 | 	TaskInfo,
 16 | 	WorkflowCancelResponse,
 17 | 	WorkflowExecuteRequest,
 18 | 	WorkflowMetadataUpdateRequest,
 19 | 	WorkflowResponse,
 20 | 	WorkflowStatusResponse,
 21 | 	WorkflowUpdateRequest,
 22 | )
 23 | 
 24 | 
 25 | class WorkflowService:
 26 | 	"""Workflow execution service."""
 27 | 
 28 | 	def __init__(self) -> None:
 29 | 		# ---------- Core resources ----------
 30 | 		self.tmp_dir: Path = Path('./tmp')
 31 | 		self.log_dir: Path = self.tmp_dir / 'logs'
 32 | 		self.log_dir.mkdir(exist_ok=True, parents=True)
 33 | 
 34 | 		# LLM / workflow executor
 35 | 		try:
 36 | 			self.llm_instance = ChatOpenAI(model='gpt-4.1-mini')
 37 | 		except Exception as exc:
 38 | 			print(f'Error initializing LLM: {exc}. Ensure OPENAI_API_KEY is set.')
 39 | 			self.llm_instance = None
 40 | 
 41 | 		self.browser_instance = Browser()
 42 | 		self.controller_instance = WorkflowController()
 43 | 
 44 | 		# In‑memory task tracking
 45 | 		self.active_tasks: Dict[str, TaskInfo] = {}
 46 | 		self.workflow_tasks: Dict[str, asyncio.Task] = {}
 47 | 		self.cancel_events: Dict[str, asyncio.Event] = {}
 48 | 
 49 | 	async def _log_file_position(self) -> int:
 50 | 		log_file = self.log_dir / 'backend.log'
 51 | 		if not log_file.exists():
 52 | 			async with aiofiles.open(log_file, 'w') as f:
 53 | 				await f.write('')
 54 | 			return 0
 55 | 		return log_file.stat().st_size
 56 | 
 57 | 	async def _read_logs_from_position(self, position: int) -> Tuple[List[str], int]:
 58 | 		log_file = self.log_dir / 'backend.log'
 59 | 		if not log_file.exists():
 60 | 			return [], 0
 61 | 
 62 | 		current_size = log_file.stat().st_size
 63 | 		if position >= current_size:
 64 | 			return [], position
 65 | 
 66 | 		async with aiofiles.open(log_file, 'r') as f:
 67 | 			await f.seek(position)
 68 | 			all_logs = await f.readlines()
 69 | 			new_logs = [
 70 | 				line
 71 | 				for line in all_logs
 72 | 				if not line.strip().startswith('INFO:')
 73 | 				and not line.strip().startswith('WARNING:')
 74 | 				and not line.strip().startswith('DEBUG:')
 75 | 				and not line.strip().startswith('ERROR:')
 76 | 			]
 77 | 		return new_logs, current_size
 78 | 
 79 | 	async def _write_log(self, log_file: Path, message: str) -> None:
 80 | 		async with aiofiles.open(log_file, 'a') as f:
 81 | 			await f.write(message)
 82 | 
 83 | 	def list_workflows(self) -> List[str]:
 84 | 		return [f.name for f in self.tmp_dir.iterdir() if f.is_file() and not f.name.startswith('temp_recording')]
 85 | 
 86 | 	def get_workflow(self, name: str) -> str:
 87 | 		wf_file = self.tmp_dir / name
 88 | 		return wf_file.read_text()
 89 | 
 90 | 	def update_workflow(self, request: WorkflowUpdateRequest) -> WorkflowResponse:
 91 | 		workflow_filename = request.filename
 92 | 		node_id = request.nodeId
 93 | 		updated_step_data = request.stepData
 94 | 
 95 | 		if not (workflow_filename and node_id is not None and updated_step_data):
 96 | 			return WorkflowResponse(success=False, error='Missing required fields')
 97 | 
 98 | 		wf_file = self.tmp_dir / workflow_filename
 99 | 		if not wf_file.exists():
100 | 			return WorkflowResponse(success=False, error=f"Workflow file '{workflow_filename}' not found")
101 | 
102 | 		workflow_content = json.loads(wf_file.read_text())
103 | 		steps = workflow_content.get('steps', [])
104 | 
105 | 		if 0 <= int(node_id) < len(steps):
106 | 			steps[int(node_id)] = updated_step_data
107 | 			wf_file.write_text(json.dumps(workflow_content, indent=2))
108 | 			return WorkflowResponse(success=True)
109 | 
110 | 		return WorkflowResponse(success=False, error='Node not found in workflow')
111 | 
112 | 	def update_workflow_metadata(self, request: WorkflowMetadataUpdateRequest) -> WorkflowResponse:
113 | 		workflow_name = request.name
114 | 		updated_metadata = request.metadata
115 | 
116 | 		if not (workflow_name and updated_metadata):
117 | 			return WorkflowResponse(success=False, error='Missing required fields')
118 | 
119 | 		wf_file = self.tmp_dir / workflow_name
120 | 		if not wf_file.exists():
121 | 			return WorkflowResponse(success=False, error='Workflow not found')
122 | 
123 | 		workflow_content = json.loads(wf_file.read_text())
124 | 		workflow_content['name'] = updated_metadata.get('name', workflow_content.get('name', ''))
125 | 		workflow_content['description'] = updated_metadata.get('description', workflow_content.get('description', ''))
126 | 		workflow_content['version'] = updated_metadata.get('version', workflow_content.get('version', ''))
127 | 
128 | 		if 'input_schema' in updated_metadata:
129 | 			workflow_content['input_schema'] = updated_metadata['input_schema']
130 | 
131 | 		wf_file.write_text(json.dumps(workflow_content, indent=2))
132 | 		return WorkflowResponse(success=True)
133 | 
134 | 	async def run_workflow_in_background(
135 | 		self,
136 | 		task_id: str,
137 | 		request: WorkflowExecuteRequest,
138 | 		cancel_event: asyncio.Event,
139 | 	) -> None:
140 | 		workflow_name = request.name
141 | 		inputs = request.inputs
142 | 		log_file = self.log_dir / 'backend.log'
143 | 		try:
144 | 			self.active_tasks[task_id] = TaskInfo(status='running', workflow=workflow_name)
145 | 			ts = time.strftime('%Y-%m-%d %H:%M:%S')
146 | 			await self._write_log(log_file, f"[{ts}] Starting workflow '{workflow_name}'\n")
147 | 			await self._write_log(log_file, f'[{ts}] Input parameters: {json.dumps(inputs)}\n')
148 | 
149 | 			if cancel_event.is_set():
150 | 				await self._write_log(log_file, f'[{ts}] Workflow cancelled before execution\n')
151 | 				self.active_tasks[task_id].status = 'cancelled'
152 | 				return
153 | 
154 | 			workflow_path = self.tmp_dir / workflow_name
155 | 			try:
156 | 				self.workflow_obj = Workflow.load_from_file(
157 | 					str(workflow_path), llm=self.llm_instance, browser=self.browser_instance, controller=self.controller_instance
158 | 				)
159 | 			except Exception as e:
160 | 				print(f'Error loading workflow: {e}')
161 | 				return
162 | 
163 | 			await self._write_log(log_file, f'[{ts}] Executing workflow...\n')
164 | 
165 | 			if cancel_event.is_set():
166 | 				await self._write_log(log_file, f'[{ts}] Workflow cancelled before execution\n')
167 | 				self.active_tasks[task_id].status = 'cancelled'
168 | 				return
169 | 
170 | 			result = await self.workflow_obj.run(inputs, close_browser_at_end=True, cancel_event=cancel_event)
171 | 
172 | 			if cancel_event.is_set():
173 | 				await self._write_log(log_file, f'[{ts}] Workflow execution was cancelled\n')
174 | 				self.active_tasks[task_id].status = 'cancelled'
175 | 				return
176 | 
177 | 			formatted_result = [
178 | 				{
179 | 					'step_id': i,
180 | 					'extracted_content': s.extracted_content,
181 | 					'status': 'completed',
182 | 				}
183 | 				for i, s in enumerate(result.step_results)
184 | 			]
185 | 			for step in formatted_result:
186 | 				await self._write_log(log_file, f'[{ts}] Completed step {step["step_id"]}: {step["extracted_content"]}\n')
187 | 
188 | 			self.active_tasks[task_id].status = 'completed'
189 | 			self.active_tasks[task_id].result = formatted_result
190 | 			await self._write_log(log_file, f'[{ts}] Workflow completed successfully with {len(result.step_results)} steps\n')
191 | 
192 | 		except asyncio.CancelledError:
193 | 			await self._write_log(log_file, f'[{time.strftime("%Y-%m-%d %H:%M:%S")}] Workflow force‑cancelled\n')
194 | 			self.active_tasks[task_id].status = 'cancelled'
195 | 			raise
196 | 		except Exception as exc:
197 | 			await self._write_log(log_file, f'[{time.strftime("%Y-%m-%d %H:%M:%S")}] Error: {exc}\n')
198 | 			self.active_tasks[task_id].status = 'failed'
199 | 			self.active_tasks[task_id].error = str(exc)
200 | 
201 | 	def get_task_status(self, task_id: str) -> Optional[WorkflowStatusResponse]:
202 | 		task_info = self.active_tasks.get(task_id)
203 | 		if not task_info:
204 | 			return None
205 | 
206 | 		return WorkflowStatusResponse(
207 | 			task_id=task_id,
208 | 			status=task_info.status,
209 | 			workflow=task_info.workflow,
210 | 			result=task_info.result,
211 | 			error=task_info.error,
212 | 		)
213 | 
214 | 	async def cancel_workflow(self, task_id: str) -> WorkflowCancelResponse:
215 | 		task_info = self.active_tasks.get(task_id)
216 | 		if not task_info:
217 | 			return WorkflowCancelResponse(success=False, message='Task not found')
218 | 		if task_info.status != 'running':
219 | 			return WorkflowCancelResponse(success=False, message=f'Task is already {task_info.status}')
220 | 
221 | 		task = self.workflow_tasks.get(task_id)
222 | 		cancel_event = self.cancel_events.get(task_id)
223 | 
224 | 		if cancel_event:
225 | 			cancel_event.set()
226 | 		if task and not task.done():
227 | 			task.cancel()
228 | 
229 | 		await self._write_log(
230 | 			self.log_dir / 'backend.log',
231 | 			f'[{time.strftime("%Y-%m-%d %H:%M:%S")}] Workflow execution for task {task_id} cancelled by user\n',
232 | 		)
233 | 
234 | 		self.active_tasks[task_id].status = 'cancelling'
235 | 		return WorkflowCancelResponse(success=True, message='Workflow cancellation requested')
236 | 


--------------------------------------------------------------------------------
/workflows/backend/views.py:
--------------------------------------------------------------------------------
 1 | from typing import Any, Dict, List, Optional
 2 | 
 3 | from pydantic import BaseModel
 4 | 
 5 | 
 6 | # Task Models
 7 | class TaskInfo(BaseModel):
 8 | 	status: str
 9 | 	workflow: str
10 | 	result: Optional[List[Dict[str, Any]]] = None
11 | 	error: Optional[str] = None
12 | 
13 | 
14 | # Request Models
15 | class WorkflowUpdateRequest(BaseModel):
16 | 	filename: str
17 | 	nodeId: int
18 | 	stepData: Dict[str, Any]
19 | 
20 | 
21 | class WorkflowMetadataUpdateRequest(BaseModel):
22 | 	name: str
23 | 	metadata: Dict[str, Any]
24 | 
25 | 
26 | class WorkflowExecuteRequest(BaseModel):
27 | 	name: str
28 | 	inputs: Dict[str, Any]
29 | 
30 | 
31 | # Response Models
32 | class WorkflowResponse(BaseModel):
33 | 	success: bool
34 | 	error: Optional[str] = None
35 | 
36 | 
37 | class WorkflowListResponse(BaseModel):
38 | 	workflows: List[str]
39 | 
40 | 
41 | class WorkflowExecuteResponse(BaseModel):
42 | 	success: bool
43 | 	task_id: str
44 | 	workflow: str
45 | 	log_position: int
46 | 	message: str
47 | 
48 | 
49 | class WorkflowLogsResponse(BaseModel):
50 | 	logs: List[str]
51 | 	position: int
52 | 	log_position: int
53 | 	status: str
54 | 	result: Optional[List[Dict[str, Any]]] = None
55 | 	error: Optional[str] = None
56 | 
57 | 
58 | class WorkflowStatusResponse(BaseModel):
59 | 	task_id: str
60 | 	status: str
61 | 	workflow: str
62 | 	result: Optional[List[Dict[str, Any]]] = None
63 | 	error: Optional[str] = None
64 | 
65 | 
66 | class WorkflowCancelResponse(BaseModel):
67 | 	success: bool
68 | 	message: str
69 | 


--------------------------------------------------------------------------------
/workflows/examples/example.workflow.json:
--------------------------------------------------------------------------------
  1 | {
  2 |   "workflow_analysis": "This workflow is about automating the process of filling out a government-related form on a website. The form requires personal information such as first name, middle name, last name, social security number, gender, and marital status. Inputs are needed for dynamic form values such as names and social security number. The workflow involves navigation, data entry, and selection of options within the form.",
  3 |   "name": "Government Form Submission",
  4 |   "description": "Automated submission of a government-related form.",
  5 |   "version": "1.0",
  6 |   "steps": [
  7 |     {
  8 |       "description": "Navigate to the form application's homepage.",
  9 |       "output": null,
 10 |       "timestamp": null,
 11 |       "tabId": null,
 12 |       "type": "navigation",
 13 |       "url": "https://v0-complex-form-example.vercel.app/"
 14 |     },
 15 |     {
 16 |       "description": "Click the 'Start Application' button to begin form entry.",
 17 |       "output": null,
 18 |       "timestamp": 1747409674925,
 19 |       "tabId": 1417505019,
 20 |       "type": "click",
 21 |       "cssSelector": "button.inline-flex.items-center.justify-center.gap-2.whitespace-nowrap.text-sm.font-medium.ring-offset-background.transition-colors.bg-primary.text-primary-foreground.h-11.rounded-md.px-8",
 22 |       "xpath": "body/div[1]/div[1]/a[1]/button[1]",
 23 |       "elementTag": "BUTTON",
 24 |       "elementText": "Start Application"
 25 |     },
 26 |     {
 27 |       "description": "Enter the first name into the form.",
 28 |       "output": null,
 29 |       "timestamp": 1747409678034,
 30 |       "tabId": 1417505019,
 31 |       "type": "input",
 32 |       "cssSelector": "input.flex.h-10.w-full.rounded-md.border.border-input.bg-background.px-3.py-2.text-base.ring-offset-background[id=\"firstName\"][name=\"firstName\"]",
 33 |       "value": "{first_name}",
 34 |       "xpath": "id(\"firstName\")",
 35 |       "elementTag": "INPUT"
 36 |     },
 37 |     {
 38 |       "description": "Press Tab to move to the next field.",
 39 |       "output": null,
 40 |       "timestamp": 1747409678270,
 41 |       "tabId": 1417505019,
 42 |       "type": "key_press",
 43 |       "cssSelector": "input.flex.h-10.w-full.rounded-md.border.border-input.bg-background.px-3.py-2.text-base.ring-offset-background[id=\"firstName\"][name=\"firstName\"]",
 44 |       "key": "Tab",
 45 |       "xpath": "id(\"firstName\")",
 46 |       "elementTag": "INPUT"
 47 |     },
 48 |     {
 49 |       "description": "Tab through the middle name field.",
 50 |       "output": null,
 51 |       "timestamp": 1747409678417,
 52 |       "tabId": 1417505019,
 53 |       "type": "key_press",
 54 |       "cssSelector": "input.flex.h-10.w-full.rounded-md.border.border-input.bg-background.px-3.py-2.text-base.ring-offset-background[id=\"middleName\"][name=\"middleName\"]",
 55 |       "key": "Tab",
 56 |       "xpath": "id(\"middleName\")",
 57 |       "elementTag": "INPUT"
 58 |     },
 59 |     {
 60 |       "description": "Enter the last name into the form.",
 61 |       "output": null,
 62 |       "timestamp": 1747409678926,
 63 |       "tabId": 1417505019,
 64 |       "type": "input",
 65 |       "cssSelector": "input.flex.h-10.w-full.rounded-md.border.border-input.bg-background.px-3.py-2.text-base.ring-offset-background[id=\"lastName\"][name=\"lastName\"]",
 66 |       "value": "{last_name}",
 67 |       "xpath": "id(\"lastName\")",
 68 |       "elementTag": "INPUT"
 69 |     },
 70 |     {
 71 |       "description": "Click to focus on the Social Security field.",
 72 |       "output": null,
 73 |       "timestamp": 1747409680009,
 74 |       "tabId": 1417505019,
 75 |       "type": "click",
 76 |       "cssSelector": "input.flex.h-10.w-full.rounded-md.border.border-input.bg-background.px-3.py-2.text-base.ring-offset-background[id=\"socialSecurityLast4\"][name=\"socialSecurityLast4\"]",
 77 |       "xpath": "id(\"socialSecurityLast4\")",
 78 |       "elementTag": "INPUT",
 79 |       "elementText": null
 80 |     },
 81 |     {
 82 |       "description": "Enter the last 4 digits of the Social Security number.",
 83 |       "output": null,
 84 |       "timestamp": 1747409680292,
 85 |       "tabId": 1417505019,
 86 |       "type": "input",
 87 |       "cssSelector": "input.flex.h-10.w-full.rounded-md.border.border-input.bg-background.px-3.py-2.text-base.ring-offset-background[id=\"socialSecurityLast4\"][name=\"socialSecurityLast4\"]",
 88 |       "value": "{social_security_last4}",
 89 |       "xpath": "id(\"socialSecurityLast4\")",
 90 |       "elementTag": "INPUT"
 91 |     },
 92 |     {
 93 |       "description": "Select 'Male' as the gender.",
 94 |       "output": null,
 95 |       "timestamp": 1747409681493,
 96 |       "tabId": 1417505019,
 97 |       "type": "click",
 98 |       "cssSelector": "button.aspect-square.h-4.w-4.rounded-full.border.border-primary.text-primary.ring-offset-background[type=\"button\"][role=\"radio\"][id=\"male\"]",
 99 |       "xpath": "id(\"male\")",
100 |       "elementTag": "BUTTON",
101 |       "elementText": null
102 |     },
103 |     {
104 |       "description": "Select 'Single' as the marital status.",
105 |       "output": null,
106 |       "timestamp": 1747409682216,
107 |       "tabId": 1417505019,
108 |       "type": "click",
109 |       "cssSelector": "button.aspect-square.h-4.w-4.rounded-full.border.border-primary.text-primary.ring-offset-background[type=\"button\"][role=\"radio\"][id=\"single\"]",
110 |       "xpath": "id(\"single\")",
111 |       "elementTag": "BUTTON",
112 |       "elementText": null
113 |     }
114 |   ],
115 |   "input_schema": [
116 |     {
117 |       "name": "first_name",
118 |       "type": "string",
119 |       "required": true
120 |     },
121 |     {
122 |       "name": "last_name",
123 |       "type": "string",
124 |       "required": true
125 |     },
126 |     {
127 |       "name": "social_security_last4",
128 |       "type": "string",
129 |       "required": true
130 |     }
131 |   ]
132 | }


--------------------------------------------------------------------------------
/workflows/examples/runner.py:
--------------------------------------------------------------------------------
 1 | import asyncio
 2 | 
 3 | from workflow_use.workflow.service import Workflow
 4 | 
 5 | 
 6 | async def main():
 7 | 	workflow = Workflow.load_from_file('examples/example.workflow.json')
 8 | 	print(workflow)
 9 | 
10 | 	first_name = 'John'
11 | 	last_name = 'Doe'
12 | 	social_security_last4 = '1234'
13 | 
14 | 	await workflow.run(
15 | 		inputs={'first_name': first_name, 'last_name': last_name, 'social_security_last4': social_security_last4},
16 | 		close_browser_at_end=False,
17 | 	)
18 | 
19 | 
20 | if __name__ == '__main__':
21 | 	asyncio.run(main())
22 | 


--------------------------------------------------------------------------------
/workflows/pyproject.toml:
--------------------------------------------------------------------------------
 1 | [project]
 2 | name = "workflow-use"
 3 | version = "0.0.2"
 4 | authors = [{ name = "Gregor Zunic" }]
 5 | description = "Create, edit, run deterministic workflows"
 6 | readme = "README.md"
 7 | requires-python = ">=3.11"
 8 | classifiers = [
 9 |     "Programming Language :: Python :: 3",
10 |     "License :: OSI Approved",
11 |     "Operating System :: OS Independent",
12 | ]
13 | 
14 | dependencies = [
15 |     "aiofiles>=24.1.0",
16 |     "browser-use>=0.2.4",
17 |     "fastapi>=0.115.12",
18 |     "fastmcp>=2.3.4",
19 |     "typer>=0.15.3",
20 |     "uvicorn>=0.34.2",
21 | ]
22 | 
23 | 
24 | [tool.uv]
25 | dev-dependencies = [
26 |     "build>=1.2.2.post1",
27 |     "ruff>=0.11.8",
28 | ]
29 | 
30 | [tool.codespell]
31 | ignore-words-list = "bu"
32 | skip = "*.json"
33 | 
34 | [tool.ruff]
35 | line-length = 130
36 | fix = true
37 | 
38 | [tool.ruff.lint]
39 | select = ["ASYNC", "E", "F", "FAST", "I", "PLE"]
40 | ignore = ["ASYNC109", "E101", "E402", "E501", "F841", "E731"]  # TODO: determine if adding timeouts to all the unbounded async functions is needed / worth-it so we can un-ignore ASYNC109
41 | unfixable = ["E101", "E402", "E501", "F841", "E731"]
42 | 
43 | [tool.ruff.format]
44 | quote-style = "single"
45 | indent-style = "tab"
46 | docstring-code-format = true
47 | 
48 | [tool.pyright]
49 | typeCheckingMode = "basic"
50 | 
51 | [build-system]
52 | requires = ["hatchling"]
53 | build-backend = "hatchling.build"
54 | 
55 | [tool.hatch.build]
56 | include = [
57 |     "workflow_use/**/*.py"
58 | ]
59 | 
60 | [tool.hatch.metadata]
61 | allow-direct-references = true
62 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/__init__.py:
--------------------------------------------------------------------------------
1 | from workflow_use.schema.views import WorkflowDefinitionSchema
2 | from workflow_use.workflow.service import Workflow
3 | 
4 | __all__ = ['WorkflowDefinitionSchema', 'Workflow']
5 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/builder/prompts.py:
--------------------------------------------------------------------------------
 1 | WORKFLOW_BUILDER_PROMPT_TEMPLATE = """\
 2 | You are a senior software engineer working with the *browser-use* open-source library.
 3 | Your task is to convert a JSON recording of browser events (provided in subsequent messages) into an
 4 | *executable JSON workflow* that the runtime can consume **directly**.
 5 | 
 6 | Input Steps Format:
 7 | - Each step from the input recording will be provided in a separate message.
 8 | - The message will contain the JSON representation of the step.
 9 | - If a screenshot is available and relevant for that step, it will follow the JSON in the format:
10 |     <Screenshot for event type 'TYPE'>
11 |     [Image Data]
12 | 
13 | Follow these rules when generating the output JSON:
14 | 0. The first thing you will output is the "workflow_analysis". First analyze the original workflow recording, what it is about and create a general analysis of the workflow. Also think about which variables are going to be needed for the workflow.
15 | 1. Top-level keys: "workflow_analysis", "name", "description", "input_schema", "steps" and "version".
16 |    - "input_schema" - MUST follow JSON-Schema draft-7 subset semantics:
17 |        [
18 |          {{"name": "foo", "type": "string", "required": true}}, 
19 |          {{"name": "bar", "type": "number"}}, 
20 |          ...
21 |        ]
22 |    - Always aim to include at least one input in "input_schema" unless the workflow is explicitly static (e.g., always navigates to a fixed URL with no user-driven variability). Base inputs on the user goal, event parameters (e.g., search queries, form inputs), or potential reusable values. For example, if the workflow searches for a term, include an input like {{"name": "search_term", "type": "string", "required": true}}.
23 |    - Only use an empty "input_schema" if no dynamic inputs are relevant after careful analysis. Justify this choice in the "workflow_analysis".
24 | 2. "steps" is an array of dictionaries executed sequentially.
25 |    - Each dictionary MUST include a `"type"` field.
26 |    - **Agentic Steps ("type": "agent")**:
27 |      - Use `"type": "agent"` for tasks where the user must interact with or select from frequently changing content, even if the website’s structure is consistent. Examples include choosing an item from a dynamic list (e.g., a restaurant from search results) or selecting a specific value from a variable set (e.g., a date from a calendar that changes with the month).
28 |      - **MUST** include a `"task"` string describing the user’s goal for the step from their perspective (e.g., "Select the restaurant named {{restaurant_name}} from the search results").
29 |      - Include a `"description"` explaining why agentic reasoning is needed (e.g., "The list of restaurants varies with each search, requiring the agent to find the specified one").
30 |      - Optionally include `"max_steps"` (defaults to 5) to limit agent exploration.
31 |      - **Replace deterministic steps with agentic steps** when the task involves:
32 |        - Selecting from a list or set of options that changes frequently (e.g., restaurants, products, or search results).
33 |        - Interacting with time-sensitive or context-dependent elements (e.g., picking a date from a calendar or a time slot from a schedule).
34 |        - Evaluating content to match user input (e.g., finding a specific item based on its name or attributes).
35 |      - Break complex tasks into multiple specific agentic steps rather than one broad task.
36 |      - **Use the user’s goal (if provided) or inferred intent from the recording** to identify where agentic steps are needed for dynamic content, even if the recording uses deterministic steps.
37 |    - **extract_page_content** - Use this type when you want to extract data from the page. If the task is simply extracting data from the page, use this instead of agentic steps (never create agentic step for simple data extraction).
38 |    - **Deterministic events** → keep the original recorder event structure. The
39 |      value of `"type"` MUST match **exactly** one of the available action
40 |      names listed below; all additional keys are interpreted as parameters for
41 |      that action.
42 |    - For each step you create also add a very short description that describes what the step tries to achieve.  
43 |    - sometimes navigating to a certain url is a side effects of another action (click, submit, key press, etc.). In that case choose either (if you think navigating to the url is the best option) or don't add the step at all.
44 | 3. When referencing workflow inputs inside event parameters or agent tasks use
45 |    the placeholder syntax `{{input_name}}` (e.g. "cssSelector": "#msg-{{row}}")
46 |    – do *not* use any prefix like "input.". Decide the inputs dynamically based on the user's
47 |    goal.
48 | 4. Quote all placeholder values to ensure the JSON parser treats them as
49 |    strings.
50 | 5. In the events you will find all the selectors relative to a particular action, replicate all of them in the workflow.
51 | 6. For many workflows steps you can go directly to certain url and skip the initial clicks (for example searching for something).
52 | 
53 | 
54 | High-level task description provided by the user (may be empty):
55 | {goal}
56 | 
57 | Available actions:
58 | {actions}
59 | 
60 | Input session events will follow one-by-one in subsequent messages.
61 | """
62 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/builder/service.py:
--------------------------------------------------------------------------------
  1 | import base64
  2 | import json
  3 | import logging
  4 | import re
  5 | from pathlib import Path
  6 | from typing import Any, Dict, List, Optional, cast
  7 | 
  8 | from langchain_core.exceptions import OutputParserException
  9 | from langchain_core.language_models import BaseChatModel
 10 | from langchain_core.messages import HumanMessage
 11 | from langchain_core.prompts import PromptTemplate
 12 | from pydantic import ValidationError
 13 | 
 14 | from workflow_use.builder.prompts import WORKFLOW_BUILDER_PROMPT_TEMPLATE
 15 | from workflow_use.controller.service import WorkflowController
 16 | from workflow_use.schema.views import WorkflowDefinitionSchema
 17 | 
 18 | logger = logging.getLogger(__name__)
 19 | 
 20 | 
 21 | class BuilderService:
 22 | 	"""
 23 | 	Service responsible for building executable workflow JSON definitions
 24 | 	from recorded browser session events using an LLM.
 25 | 	"""
 26 | 
 27 | 	def __init__(self, llm: BaseChatModel):
 28 | 		"""
 29 | 		Initializes the BuilderService.
 30 | 
 31 | 		Args:
 32 | 		    llm: A LangChain BaseChatModel instance configured for use.
 33 | 		         It should ideally support vision capabilities if screenshots are used.
 34 | 		"""
 35 | 		if llm is None:
 36 | 			raise ValueError('A BaseChatModel instance must be provided.')
 37 | 
 38 | 		# Configure the LLM to return structured output based on the Pydantic model
 39 | 		try:
 40 | 			# Specify method="function_calling" for better compatibility
 41 | 			self.llm_structured = llm.with_structured_output(WorkflowDefinitionSchema, method='function_calling')
 42 | 		except NotImplementedError:
 43 | 			logger.warning('LLM does not support structured output natively. Falling back.')
 44 | 			# Basic LLM call if structured output is not supported
 45 | 			# Output parsing will be handled manually later
 46 | 			self.llm_structured = llm  # Store the original llm
 47 | 
 48 | 		self.prompt_template = PromptTemplate.from_template(WORKFLOW_BUILDER_PROMPT_TEMPLATE)
 49 | 		self.actions_markdown = self._get_available_actions_markdown()
 50 | 		logger.info('BuilderService initialized.')
 51 | 
 52 | 	def _get_available_actions_markdown(self) -> str:
 53 | 		"""Return a markdown list of available actions and their schema."""
 54 | 		controller = WorkflowController()
 55 | 		lines: List[str] = []
 56 | 		for action in controller.registry.registry.actions.values():
 57 | 			# Only include deterministic actions relevant for building from recordings
 58 | 			# Exclude agent-specific or meta-actions if necessary
 59 | 			# Based on schema/views.py, the recorder types seem to map directly
 60 | 			# to controller action *names*, but the prompt uses the event `type` field.
 61 | 			# Let's assume the prompt template correctly lists the *event types* expected.
 62 | 			# This function provides the detailed schema for the LLM.
 63 | 			schema_info = action.param_model.model_json_schema()
 64 | 			# Simplify schema representation for the prompt if too verbose
 65 | 			param_details = []
 66 | 			props = schema_info.get('properties', {})
 67 | 			required = schema_info.get('required', [])
 68 | 			for name, details in props.items():
 69 | 				req_star = '*' if name in required else ''
 70 | 				param_details.append(f'`{name}`{req_star} ({details.get("type", "any")})')
 71 | 
 72 | 			lines.append(f'- **`{action.name}`**: {action.description}')  # Using action name from controller
 73 | 			if param_details:
 74 | 				lines.append(f'  - Parameters: {", ".join(param_details)}')
 75 | 
 76 | 		# Add descriptions for agent/extract_content types manually if not in controller
 77 | 		if 'agent' not in [a.name for a in controller.registry.registry.actions.values()]:
 78 | 			lines.append('- **`agent`**: Executes a task using an autonomous agent.')
 79 | 			lines.append('  - Parameters: `task`* (string), `description` (string), `max_steps` (integer)')
 80 | 		# if "extract_content" not in [
 81 | 		#     a.name for a in controller.registry.registry.actions.values()
 82 | 		# ]:
 83 | 		#     lines.append(
 84 | 		#         "- **`extract_content`**: Uses an LLM to extract specific information from the current page."
 85 | 		#     )
 86 | 		#     lines.append(
 87 | 		#         "  - Parameters: `goal`* (string), `description` (string), `should_strip_link_urls` (boolean)"
 88 | 		#     )
 89 | 
 90 | 		logger.debug(f'Generated actions markdown:\n{lines}')
 91 | 		return '\n'.join(lines)
 92 | 
 93 | 	@staticmethod
 94 | 	def _find_first_user_interaction_url(events: List[Dict[str, Any]]) -> Optional[str]:
 95 | 		"""Finds the URL of the first recorded user interaction."""
 96 | 		return next(
 97 | 			(
 98 | 				evt.get('frameUrl')
 99 | 				for evt in events
100 | 				if evt.get('type')
101 | 				in [
102 | 					'input',
103 | 					'click',
104 | 					'scroll',
105 | 					'select_change',
106 | 					'key_press',
107 | 				]  # Added more types
108 | 			),
109 | 			None,
110 | 		)
111 | 
112 | 	def _parse_llm_output_to_workflow(self, llm_content: str) -> WorkflowDefinitionSchema:
113 | 		"""Attempts to parse the LLM string output into a WorkflowDefinitionSchema."""
114 | 		logger.debug(f'Raw LLM Output:\n{llm_content}')
115 | 		content_to_parse = llm_content
116 | 
117 | 		# Heuristic cleanup: Extract JSON from markdown code blocks
118 | 		if '```json' in content_to_parse:
119 | 			match = re.search(r'```json\s*([\s\S]*?)\s*```', content_to_parse, re.DOTALL)
120 | 			if match:
121 | 				content_to_parse = match.group(1).strip()
122 | 				logger.debug('Extracted JSON from ```json block.')
123 | 		elif content_to_parse.strip().startswith('{') and content_to_parse.strip().endswith('}'):
124 | 			# Assume it's already JSON if it looks like it
125 | 			content_to_parse = content_to_parse.strip()
126 | 			logger.debug('Assuming raw output is JSON.')
127 | 		else:
128 | 			logger.warning('Could not reliably extract JSON from LLM output, attempting parse anyway.')
129 | 
130 | 		try:
131 | 			# Try parsing directly first (might work with structured output)
132 | 			workflow_data = WorkflowDefinitionSchema.model_validate_json(content_to_parse)
133 | 			logger.info('Successfully parsed LLM output into WorkflowDefinitionSchema.')
134 | 			return workflow_data
135 | 		except (json.JSONDecodeError, ValidationError) as e:
136 | 			logger.error(f'Failed to parse LLM output into WorkflowDefinitionSchema: {e}')
137 | 			logger.debug(f'Content attempted parsing:\n{content_to_parse}')
138 | 			raise ValueError(f'LLM output could not be parsed into a valid Workflow schema. Error: {e}') from e
139 | 
140 | 	async def build_workflow(
141 | 		self,
142 | 		input_workflow: WorkflowDefinitionSchema,
143 | 		user_goal: str,
144 | 		use_screenshots: bool = False,
145 | 		max_images: int = 20,
146 | 	) -> WorkflowDefinitionSchema:
147 | 		"""
148 | 		Generates an enhanced Workflow definition from an input workflow object using an LLM.
149 | 
150 | 		Args:
151 | 		    input_workflow: The initial WorkflowDefinitionSchema object containing steps to process.
152 | 		    user_goal: Optional high-level description of the workflow's purpose.
153 | 		               If None, the user might be prompted interactively.
154 | 		    use_screenshots: Whether to include screenshots as visual context for the LLM (if available in steps).
155 | 		    max_images: Maximum number of screenshots to include (to manage cost/tokens).
156 | 
157 | 		Returns:
158 | 		    A new WorkflowDefinitionSchema object generated by the LLM.
159 | 
160 | 		Raises:
161 | 		    ValueError: If the input workflow is invalid or the LLM output cannot be parsed.
162 | 		    Exception: For other LLM or processing errors.
163 | 		"""
164 | 		# Validate input slightly
165 | 		if not input_workflow or not isinstance(input_workflow.steps, list):
166 | 			raise ValueError('Invalid input_workflow object provided.')
167 | 
168 | 		# Handle user goal
169 | 		goal = user_goal
170 | 		if goal is None:
171 | 			try:
172 | 				goal = input('Please describe the high-level task for the workflow (optional, press Enter to skip): ').strip()
173 | 			except EOFError:  # Handle non-interactive environments
174 | 				goal = ''
175 | 		goal = goal or 'Automate the recorded browser actions.'  # Default goal if empty
176 | 
177 | 		# Format the main instruction prompt
178 | 		prompt_str = self.prompt_template.format(
179 | 			actions=self.actions_markdown,
180 | 			goal=goal,
181 | 		)
182 | 
183 | 		# Prepare the vision messages list
184 | 		vision_messages: List[Dict[str, Any]] = [{'type': 'text', 'text': prompt_str}]
185 | 
186 | 		# Integrate message preparation logic here
187 | 		images_used = 0
188 | 		for step in input_workflow.steps:
189 | 			step_messages: List[Dict[str, Any]] = []  # Messages for this specific step
190 | 
191 | 			# 1. Text representation (JSON dump)
192 | 			step_dict = step.model_dump(mode='json', exclude_none=True)
193 | 			screenshot_data = step_dict.pop('screenshot', None)  # Pop potential screenshot
194 | 			step_messages.append({'type': 'text', 'text': json.dumps(step_dict, indent=2)})
195 | 
196 | 			# 2. Optional screenshot
197 | 			attach_image = use_screenshots and images_used < max_images
198 | 			step_type = getattr(step, 'type', step_dict.get('type'))
199 | 
200 | 			if attach_image and step_type != 'input':  # Don't attach for inputs
201 | 				# Re-retrieve screenshot data if it wasn't popped (e.g., nested under 'data')
202 | 				# This assumes screenshot might still be in the original step model or dict
203 | 				# A bit redundant, ideally screenshot handling is consistent
204 | 				screenshot = screenshot_data or getattr(step, 'screenshot', None) or step_dict.get('data', {}).get('screenshot')
205 | 
206 | 				if screenshot:
207 | 					if isinstance(screenshot, str) and screenshot.startswith('data:'):
208 | 						screenshot = screenshot.split(',', 1)[-1]
209 | 
210 | 					# Validate base64 payload
211 | 					try:
212 | 						base64.b64decode(cast(str, screenshot), validate=True)
213 | 						meta = f"<Screenshot for event type '{step_type}'>"
214 | 						step_messages.append({'type': 'text', 'text': meta})
215 | 						step_messages.append(
216 | 							{
217 | 								'type': 'image_url',
218 | 								'image_url': {'url': f'data:image/png;base64,{screenshot}'},
219 | 							}
220 | 						)
221 | 						images_used += 1  # Increment image count *only* if successfully added
222 | 					except (TypeError, ValueError, Exception) as e:
223 | 						logger.warning(
224 | 							f"Invalid or missing screenshot for step type '{step_type}' "
225 | 							f'@ {step_dict.get("timestamp", "")}. Error: {e}'
226 | 						)
227 | 						# Don't add image messages if invalid
228 | 
229 | 			# Add the messages for this step to the main list
230 | 			vision_messages.extend(step_messages)
231 | 
232 | 		logger.info(f'Prepared {len(vision_messages)} total message parts, including {images_used} images.')
233 | 
234 | 		# Invoke the LLM (structured output preferred)
235 | 		try:
236 | 			# Invoke the LLM (structured output preferred)
237 | 			# Need to handle cases where structured output isn't truly supported
238 | 			if hasattr(self.llm_structured, 'output_schema'):  # Check if it seems like structured output model
239 | 				llm_response = await self.llm_structured.ainvoke([HumanMessage(content=cast(Any, vision_messages))])
240 | 				# If structured output worked, llm_response is the Pydantic object
241 | 				if isinstance(llm_response, WorkflowDefinitionSchema):
242 | 					workflow_data = llm_response
243 | 				else:
244 | 					# It might have returned a message or dict, try parsing its content
245 | 					content = getattr(llm_response, 'content', str(llm_response))
246 | 					workflow_data = self._parse_llm_output_to_workflow(str(content))
247 | 			else:
248 | 				# Fallback to basic LLM call and manual parsing
249 | 				llm_response = await self.llm_structured.ainvoke([HumanMessage(content=cast(Any, vision_messages))])
250 | 				llm_content = str(getattr(llm_response, 'content', llm_response))  # Get string content
251 | 				workflow_data = self._parse_llm_output_to_workflow(llm_content)
252 | 
253 | 		except OutputParserException as ope:
254 | 			logger.error(f'LLM output parsing failed (OutputParserException): {ope}')
255 | 			# Try to parse the raw output as a fallback
256 | 			raw_output = getattr(ope, 'llm_output', str(ope))
257 | 			logger.info('Attempting to parse raw output as fallback...')
258 | 			try:
259 | 				workflow_data = self._parse_llm_output_to_workflow(raw_output)
260 | 			except ValueError as ve_fallback:
261 | 				raise ValueError(
262 | 					f'LLM structured output failed, and fallback parsing also failed. Error: {ve_fallback}'
263 | 				) from ve_fallback
264 | 		except Exception as e:
265 | 			logger.exception(f'An error occurred during LLM invocation or processing: {e}')
266 | 			raise  # Re-raise other unexpected errors
267 | 
268 | 		# Return the workflow data object directly
269 | 		return workflow_data
270 | 
271 | 	# path handlers
272 | 	async def build_workflow_from_path(self, path: Path, user_goal: str) -> WorkflowDefinitionSchema:
273 | 		"""Build a workflow from a JSON file path."""
274 | 		with open(path, 'r') as f:
275 | 			workflow_data = json.load(f)
276 | 
277 | 		workflow_data_schema = WorkflowDefinitionSchema.model_validate(workflow_data)
278 | 		return await self.build_workflow(workflow_data_schema, user_goal)
279 | 
280 | 	async def save_workflow_to_path(self, workflow: WorkflowDefinitionSchema, path: Path):
281 | 		"""Save a workflow to a JSON file path."""
282 | 		with open(path, 'w') as f:
283 | 			json.dump(workflow.model_dump(mode='json'), f, indent=2)
284 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/builder/tests/build_workflow.py:
--------------------------------------------------------------------------------
 1 | import asyncio
 2 | from pathlib import Path
 3 | 
 4 | # Ensure langchain-openai is installed and OPENAI_API_KEY is set
 5 | from langchain_openai import ChatOpenAI
 6 | 
 7 | from workflow_use.builder.service import BuilderService
 8 | 
 9 | # Instantiate the LLM and the service directly
10 | llm_instance = ChatOpenAI(model='gpt-4o')  # Or your preferred model
11 | builder_service = BuilderService(llm=llm_instance)
12 | 
13 | 
14 | async def test_build_workflow_from_path():
15 | 	"""
16 | 	Tests that the workflow is built correctly from a JSON file path.
17 | 	"""
18 | 	path = Path(__file__).parent / 'tmp' / 'recording.json'
19 | 	workflow_definition = await builder_service.build_workflow_from_path(
20 | 		path,
21 | 		'go to apple.com and extract the price of the iphone XY (where XY is a variable)',
22 | 	)
23 | 
24 | 	print(workflow_definition)
25 | 
26 | 	output_path = path.with_suffix('.workflow.json')
27 | 	await builder_service.save_workflow_to_path(workflow_definition, output_path)
28 | 
29 | 
30 | if __name__ == '__main__':
31 | 	asyncio.run(test_build_workflow_from_path())
32 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/controller/service.py:
--------------------------------------------------------------------------------
  1 | import asyncio
  2 | import logging
  3 | 
  4 | from browser_use import Browser
  5 | from browser_use.agent.views import ActionResult
  6 | from browser_use.controller.service import Controller
  7 | from langchain_core.language_models.chat_models import BaseChatModel
  8 | from langchain_core.prompts import PromptTemplate
  9 | 
 10 | from workflow_use.controller.utils import get_best_element_handle, truncate_selector
 11 | from workflow_use.controller.views import (
 12 | 	ClickElementDeterministicAction,
 13 | 	InputTextDeterministicAction,
 14 | 	KeyPressDeterministicAction,
 15 | 	NavigationAction,
 16 | 	PageExtractionAction,
 17 | 	ScrollDeterministicAction,
 18 | 	SelectDropdownOptionDeterministicAction,
 19 | )
 20 | 
 21 | logger = logging.getLogger(__name__)
 22 | 
 23 | DEFAULT_ACTION_TIMEOUT_MS = 1000
 24 | 
 25 | # List of default actions from browser_use.controller.service.Controller to disable
 26 | # todo: come up with a better way to filter out the actions (filter IN the actions would be much nicer in this case)
 27 | DISABLED_DEFAULT_ACTIONS = [
 28 | 	'done',
 29 | 	'search_google',
 30 | 	'go_to_url',  # I am using this action from the main controller to avoid duplication
 31 | 	'go_back',
 32 | 	'wait',
 33 | 	'click_element_by_index',
 34 | 	'input_text',
 35 | 	'save_pdf',
 36 | 	'switch_tab',
 37 | 	'open_tab',
 38 | 	'close_tab',
 39 | 	'extract_content',
 40 | 	'scroll_down',
 41 | 	'scroll_up',
 42 | 	'send_keys',
 43 | 	'scroll_to_text',
 44 | 	'get_dropdown_options',
 45 | 	'select_dropdown_option',
 46 | 	'drag_drop',
 47 | 	'get_sheet_contents',
 48 | 	'select_cell_or_range',
 49 | 	'get_range_contents',
 50 | 	'clear_selected_range',
 51 | 	'input_selected_cell_text',
 52 | 	'update_range_contents',
 53 | ]
 54 | 
 55 | 
 56 | class WorkflowController(Controller):
 57 | 	def __init__(self, *args, **kwargs):
 58 | 		# Pass the list of actions to exclude to the base class constructor
 59 | 		super().__init__(*args, exclude_actions=DISABLED_DEFAULT_ACTIONS, **kwargs)
 60 | 		self.__register_actions()
 61 | 
 62 | 	def __register_actions(self):
 63 | 		# Navigate to URL ------------------------------------------------------------
 64 | 		@self.registry.action('Manually navigate to URL', param_model=NavigationAction)
 65 | 		async def navigation(params: NavigationAction, browser_session: Browser) -> ActionResult:
 66 | 			"""Navigate to the given URL."""
 67 | 			page = await browser_session.get_current_page()
 68 | 			await page.goto(params.url)
 69 | 			await page.wait_for_load_state()
 70 | 
 71 | 			msg = f'🔗  Navigated to URL: {params.url}'
 72 | 			logger.info(msg)
 73 | 			return ActionResult(extracted_content=msg, include_in_memory=True)
 74 | 
 75 | 		# Click element by CSS selector --------------------------------------------------
 76 | 
 77 | 		@self.registry.action(
 78 | 			'Click element by all available selectors',
 79 | 			param_model=ClickElementDeterministicAction,
 80 | 		)
 81 | 		async def click(params: ClickElementDeterministicAction, browser_session: Browser) -> ActionResult:
 82 | 			"""Click the first element matching *params.cssSelector* with fallback mechanisms."""
 83 | 			page = await browser_session.get_current_page()
 84 | 			original_selector = params.cssSelector
 85 | 
 86 | 			try:
 87 | 				locator, selector_used = await get_best_element_handle(
 88 | 					page,
 89 | 					params.cssSelector,
 90 | 					params,
 91 | 					timeout_ms=DEFAULT_ACTION_TIMEOUT_MS,
 92 | 				)
 93 | 				await locator.click(force=True)
 94 | 
 95 | 				msg = f'🖱️  Clicked element with CSS selector: {truncate_selector(selector_used)} (original: {truncate_selector(original_selector)})'
 96 | 				logger.info(msg)
 97 | 				return ActionResult(extracted_content=msg, include_in_memory=True)
 98 | 			except Exception as e:
 99 | 				error_msg = f'Failed to click element. Original selector: {truncate_selector(original_selector)}. Error: {str(e)}'
100 | 				logger.error(error_msg)
101 | 				raise Exception(error_msg)
102 | 
103 | 		# Input text into element --------------------------------------------------------
104 | 		@self.registry.action(
105 | 			'Input text into an element by all available selectors',
106 | 			param_model=InputTextDeterministicAction,
107 | 		)
108 | 		async def input(
109 | 			params: InputTextDeterministicAction,
110 | 			browser_session: Browser,
111 | 			has_sensitive_data: bool = False,
112 | 		) -> ActionResult:
113 | 			"""Fill text into the element located with *params.cssSelector*."""
114 | 			page = await browser_session.get_current_page()
115 | 			original_selector = params.cssSelector
116 | 
117 | 			try:
118 | 				locator, selector_used = await get_best_element_handle(
119 | 					page,
120 | 					params.cssSelector,
121 | 					params,
122 | 					timeout_ms=DEFAULT_ACTION_TIMEOUT_MS,
123 | 				)
124 | 
125 | 				# Check if it's a SELECT element
126 | 				is_select = await locator.evaluate('(el) => el.tagName === "SELECT"')
127 | 				if is_select:
128 | 					return ActionResult(
129 | 						extracted_content='Ignored input into select element',
130 | 						include_in_memory=True,
131 | 					)
132 | 
133 | 				# Add a small delay and click to ensure the element is focused
134 | 				await locator.fill(params.value)
135 | 				await asyncio.sleep(0.5)
136 | 				await locator.click(force=True)
137 | 				await asyncio.sleep(0.5)
138 | 
139 | 				msg = f'⌨️  Input "{params.value}" into element with CSS selector: {truncate_selector(selector_used)} (original: {truncate_selector(original_selector)})'
140 | 				logger.info(msg)
141 | 				return ActionResult(extracted_content=msg, include_in_memory=True)
142 | 			except Exception as e:
143 | 				error_msg = f'Failed to input text. Original selector: {truncate_selector(original_selector)}. Error: {str(e)}'
144 | 				logger.error(error_msg)
145 | 				raise Exception(error_msg)
146 | 
147 | 		# Select dropdown option ---------------------------------------------------------
148 | 		@self.registry.action(
149 | 			'Select dropdown option by all available selectors and visible text',
150 | 			param_model=SelectDropdownOptionDeterministicAction,
151 | 		)
152 | 		async def select_change(params: SelectDropdownOptionDeterministicAction, browser_session: Browser) -> ActionResult:
153 | 			"""Select dropdown option whose visible text equals *params.value*."""
154 | 			page = await browser_session.get_current_page()
155 | 			original_selector = params.cssSelector
156 | 
157 | 			try:
158 | 				locator, selector_used = await get_best_element_handle(
159 | 					page,
160 | 					params.cssSelector,
161 | 					params,
162 | 					timeout_ms=DEFAULT_ACTION_TIMEOUT_MS,
163 | 				)
164 | 
165 | 				await locator.select_option(label=params.selectedText)
166 | 
167 | 				msg = f'Selected option "{params.selectedText}" in dropdown {truncate_selector(selector_used)} (original: {truncate_selector(original_selector)})'
168 | 				logger.info(msg)
169 | 				return ActionResult(extracted_content=msg, include_in_memory=True)
170 | 			except Exception as e:
171 | 				error_msg = f'Failed to select option. Original selector: {truncate_selector(original_selector)}. Error: {str(e)}'
172 | 				logger.error(error_msg)
173 | 				raise Exception(error_msg)
174 | 
175 | 		# Key press action ------------------------------------------------------------
176 | 		@self.registry.action(
177 | 			'Press key on element by all available selectors',
178 | 			param_model=KeyPressDeterministicAction,
179 | 		)
180 | 		async def key_press(params: KeyPressDeterministicAction, browser_session: Browser) -> ActionResult:
181 | 			"""Press *params.key* on the element identified by *params.cssSelector*."""
182 | 			page = await browser_session.get_current_page()
183 | 			original_selector = params.cssSelector
184 | 
185 | 			try:
186 | 				locator, selector_used = await get_best_element_handle(page, params.cssSelector, params, timeout_ms=5000)
187 | 
188 | 				await locator.press(params.key)
189 | 
190 | 				msg = f"🔑  Pressed key '{params.key}' on element with CSS selector: {truncate_selector(selector_used)} (original: {truncate_selector(original_selector)})"
191 | 				logger.info(msg)
192 | 				return ActionResult(extracted_content=msg, include_in_memory=True)
193 | 			except Exception as e:
194 | 				error_msg = f'Failed to press key. Original selector: {truncate_selector(original_selector)}. Error: {str(e)}'
195 | 				logger.error(error_msg)
196 | 				raise Exception(error_msg)
197 | 
198 | 		# Scroll action --------------------------------------------------------------
199 | 		@self.registry.action('Scroll page', param_model=ScrollDeterministicAction)
200 | 		async def scroll(params: ScrollDeterministicAction, browser_session: Browser) -> ActionResult:
201 | 			"""Scroll the page by the given x/y pixel offsets."""
202 | 			page = await browser_session.get_current_page()
203 | 			await page.evaluate(f'window.scrollBy({params.scrollX}, {params.scrollY});')
204 | 			msg = f'📜  Scrolled page by (x={params.scrollX}, y={params.scrollY})'
205 | 			logger.info(msg)
206 | 			return ActionResult(extracted_content=msg, include_in_memory=True)
207 | 
208 | 			# Extract content ------------------------------------------------------------
209 | 
210 | 		@self.registry.action(
211 | 			'Extract page content to retrieve specific information from the page, e.g. all company names, a specific description, all information about, links with companies in structured format or simply links',
212 | 			param_model=PageExtractionAction,
213 | 		)
214 | 		async def extract_page_content(
215 | 			params: PageExtractionAction, browser_session: Browser, page_extraction_llm: BaseChatModel
216 | 		):
217 | 			page = await browser_session.get_current_page()
218 | 			import markdownify
219 | 
220 | 			strip = ['a', 'img']
221 | 
222 | 			content = markdownify.markdownify(await page.content(), strip=strip)
223 | 
224 | 			# manually append iframe text into the content so it's readable by the LLM (includes cross-origin iframes)
225 | 			for iframe in page.frames:
226 | 				if iframe.url != page.url and not iframe.url.startswith('data:'):
227 | 					content += f'\n\nIFRAME {iframe.url}:\n'
228 | 					content += markdownify.markdownify(await iframe.content())
229 | 
230 | 			prompt = 'Your task is to extract the content of the page. You will be given a page and a goal and you should extract all relevant information around this goal from the page. If the goal is vague, summarize the page. Respond in json format. Extraction goal: {goal}, Page: {page}'
231 | 			template = PromptTemplate(input_variables=['goal', 'page'], template=prompt)
232 | 			try:
233 | 				output = await page_extraction_llm.ainvoke(template.format(goal=params.goal, page=content))
234 | 				msg = f'📄  Extracted from page\n: {output.content}\n'
235 | 				logger.info(msg)
236 | 				return ActionResult(extracted_content=msg, include_in_memory=True)
237 | 			except Exception as e:
238 | 				logger.debug(f'Error extracting content: {e}')
239 | 				msg = f'📄  Extracted from page\n: {content}\n'
240 | 				logger.info(msg)
241 | 				return ActionResult(extracted_content=msg)
242 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/controller/utils.py:
--------------------------------------------------------------------------------
  1 | import logging
  2 | import re
  3 | 
  4 | logger = logging.getLogger(__name__)
  5 | 
  6 | 
  7 | def truncate_selector(selector: str, max_length: int = 35) -> str:
  8 | 	"""Truncate a CSS selector to a maximum length, adding ellipsis if truncated."""
  9 | 	return selector if len(selector) <= max_length else f'{selector[:max_length]}...'
 10 | 
 11 | 
 12 | async def get_best_element_handle(page, selector, params=None, timeout_ms=500):
 13 | 	"""Find element using stability-ranked selector strategies."""
 14 | 	original_selector = selector
 15 | 
 16 | 	# Generate stability-ranked fallback selectors
 17 | 	fallbacks = generate_stable_selectors(selector, params)
 18 | 
 19 | 	# Try all selectors with exponential backoff for timeouts
 20 | 	selectors_to_try = [original_selector] + fallbacks
 21 | 
 22 | 	for try_selector in selectors_to_try:
 23 | 		try:
 24 | 			logger.info(f'Trying selector: {truncate_selector(try_selector)}')
 25 | 			locator = page.locator(try_selector)
 26 | 			await locator.wait_for(state='visible', timeout=timeout_ms)
 27 | 			logger.info(f'Found element with selector: {truncate_selector(try_selector)}')
 28 | 			return locator, try_selector
 29 | 		except Exception as e:
 30 | 			logger.error(f'Selector failed: {truncate_selector(try_selector)} with error: {e}')
 31 | 
 32 | 	# Try XPath as last resort
 33 | 	if params and getattr(params, 'xpath', None):
 34 | 		xpath = params.xpath
 35 | 		try:
 36 | 			# Generate stable XPath alternatives
 37 | 			xpath_alternatives = [xpath] + generate_stable_xpaths(xpath, params)
 38 | 
 39 | 			for try_xpath in xpath_alternatives:
 40 | 				xpath_selector = f'xpath={try_xpath}'
 41 | 				logger.info(f'Trying XPath: {truncate_selector(xpath_selector)}')
 42 | 				locator = page.locator(xpath_selector)
 43 | 				await locator.wait_for(state='visible', timeout=timeout_ms)
 44 | 				return locator, xpath_selector
 45 | 		except Exception as e:
 46 | 			logger.error(f'All XPaths failed with error: {e}')
 47 | 
 48 | 	raise Exception(f'Failed to find element. Original: {original_selector}')
 49 | 
 50 | 
 51 | def generate_stable_selectors(selector, params=None):
 52 | 	"""Generate selectors from most to least stable based on selector patterns."""
 53 | 	fallbacks = []
 54 | 
 55 | 	# 1. Extract attribute-based selectors (most stable)
 56 | 	attributes_to_check = [
 57 | 		'placeholder',
 58 | 		'aria-label',
 59 | 		'name',
 60 | 		'title',
 61 | 		'role',
 62 | 		'data-testid',
 63 | 	]
 64 | 	for attr in attributes_to_check:
 65 | 		attr_pattern = rf'\[{attr}\*?=[\'"]([^\'"]*)[\'"]'
 66 | 		attr_match = re.search(attr_pattern, selector)
 67 | 		if attr_match:
 68 | 			attr_value = attr_match.group(1)
 69 | 			element_tag = extract_element_tag(selector, params)
 70 | 			if element_tag:
 71 | 				fallbacks.append(f'{element_tag}[{attr}*="{attr_value}"]')
 72 | 
 73 | 	# 2. Combine tag + class + one attribute (good stability)
 74 | 	element_tag = extract_element_tag(selector, params)
 75 | 	classes = extract_stable_classes(selector)
 76 | 	for attr in attributes_to_check:
 77 | 		attr_pattern = rf'\[{attr}\*?=[\'"]([^\'"]*)[\'"]'
 78 | 		attr_match = re.search(attr_pattern, selector)
 79 | 		if attr_match and classes and element_tag:
 80 | 			attr_value = attr_match.group(1)
 81 | 			class_selector = '.'.join(classes)
 82 | 			fallbacks.append(f'{element_tag}.{class_selector}[{attr}*="{attr_value}"]')
 83 | 
 84 | 	# 3. Tag + class combination (less stable but often works)
 85 | 	if element_tag and classes:
 86 | 		class_selector = '.'.join(classes)
 87 | 		fallbacks.append(f'{element_tag}.{class_selector}')
 88 | 
 89 | 	# 4. Remove dynamic parts (IDs, state classes)
 90 | 	if '[id=' in selector:
 91 | 		fallbacks.append(re.sub(r'\[id=[\'"].*?[\'"]\]', '', selector))
 92 | 
 93 | 	for state in ['.focus-visible', '.hover', '.active', '.focus', ':focus']:
 94 | 		if state in selector:
 95 | 			fallbacks.append(selector.replace(state, ''))
 96 | 
 97 | 	# 5. Use text-based selector if we have element tag and text
 98 | 	if params and getattr(params, 'elementTag', None) and getattr(params, 'elementText', None) and params.elementText.strip():
 99 | 		fallbacks.append(f"{params.elementTag}:has-text('{params.elementText}')")
100 | 
101 | 	return list(dict.fromkeys(fallbacks))  # Remove duplicates while preserving order
102 | 
103 | 
104 | def extract_element_tag(selector, params=None):
105 | 	"""Extract element tag from selector or params."""
106 | 	# Try to get from selector first
107 | 	tag_match = re.match(r'^([a-zA-Z][a-zA-Z0-9]*)', selector)
108 | 	if tag_match:
109 | 		return tag_match.group(1).lower()
110 | 
111 | 	# Fall back to params
112 | 	if params and getattr(params, 'elementTag', None):
113 | 		return params.elementTag.lower()
114 | 
115 | 	return ''
116 | 
117 | 
118 | def extract_stable_classes(selector):
119 | 	"""Extract classes that appear to be stable (not state-related)."""
120 | 	class_pattern = r'\.([a-zA-Z0-9_-]+)'
121 | 	classes = re.findall(class_pattern, selector)
122 | 
123 | 	# Filter out likely state classes
124 | 	stable_classes = [
125 | 		cls
126 | 		for cls in classes
127 | 		if not any(state in cls.lower() for state in ['focus', 'hover', 'active', 'selected', 'checked', 'disabled'])
128 | 	]
129 | 
130 | 	return stable_classes
131 | 
132 | 
133 | def generate_stable_xpaths(xpath, params=None):
134 | 	"""Generate stable XPath alternatives."""
135 | 	alternatives = []
136 | 
137 | 	# Handle "id()" XPath pattern which is brittle
138 | 	if 'id(' in xpath:
139 | 		element_tag = getattr(params, 'elementTag', '').lower()
140 | 		if element_tag:
141 | 			# Create XPaths based on attributes from params
142 | 			if params and getattr(params, 'cssSelector', None):
143 | 				for attr in ['placeholder', 'aria-label', 'title', 'name']:
144 | 					attr_pattern = rf'\[{attr}\*?=[\'"]([^\'"]*)[\'"]'
145 | 					attr_match = re.search(attr_pattern, params.cssSelector)
146 | 					if attr_match:
147 | 						attr_value = attr_match.group(1)
148 | 						alternatives.append(f"//{element_tag}[contains(@{attr}, '{attr_value}')]")
149 | 
150 | 	return alternatives
151 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/controller/views.py:
--------------------------------------------------------------------------------
 1 | from typing import Literal, Optional
 2 | 
 3 | from pydantic import BaseModel
 4 | 
 5 | 
 6 | # Shared config allowing extra fields so recorder payloads pass through
 7 | class _BaseExtra(BaseModel):
 8 | 	"""Base model ignoring unknown fields."""
 9 | 
10 | 	class Config:
11 | 		extra = 'ignore'
12 | 
13 | 
14 | # Mixin for shared step metadata (timestamp and tab context)
15 | class StepMeta(_BaseExtra):
16 | 	timestamp: int
17 | 	tabId: int
18 | 
19 | 
20 | # Common optional fields present in recorder events
21 | class RecorderBase(StepMeta):
22 | 	xpath: Optional[str] = None
23 | 	elementTag: Optional[str] = None
24 | 	elementText: Optional[str] = None
25 | 	frameUrl: Optional[str] = None
26 | 	screenshot: Optional[str] = None
27 | 
28 | 
29 | class ClickElementDeterministicAction(RecorderBase):
30 | 	"""Parameters for clicking an element identified by CSS selector."""
31 | 
32 | 	type: Literal['click']
33 | 	cssSelector: str
34 | 
35 | 
36 | class InputTextDeterministicAction(RecorderBase):
37 | 	"""Parameters for entering text into an input field identified by CSS selector."""
38 | 
39 | 	type: Literal['input']
40 | 	cssSelector: str
41 | 	value: str
42 | 
43 | 
44 | class SelectDropdownOptionDeterministicAction(RecorderBase):
45 | 	"""Parameters for selecting a dropdown option identified by *selector* and *text*."""
46 | 
47 | 	type: Literal['select_change']
48 | 	cssSelector: str
49 | 	selectedValue: str
50 | 	selectedText: str
51 | 
52 | 
53 | class KeyPressDeterministicAction(RecorderBase):
54 | 	"""Parameters for pressing a key on an element identified by CSS selector."""
55 | 
56 | 	type: Literal['key_press']
57 | 	cssSelector: str
58 | 	key: str
59 | 
60 | 
61 | class NavigationAction(_BaseExtra):
62 | 	"""Parameters for navigating to a URL."""
63 | 
64 | 	type: Literal['navigation']
65 | 	url: str
66 | 
67 | 
68 | class ScrollDeterministicAction(_BaseExtra):
69 | 	"""Parameters for scrolling the page by x/y offsets (pixels)."""
70 | 
71 | 	type: Literal['scroll']
72 | 	scrollX: int = 0
73 | 	scrollY: int = 0
74 | 	targetId: Optional[int] = None
75 | 
76 | 
77 | class PageExtractionAction(_BaseExtra):
78 | 	"""Parameters for extracting content from the page."""
79 | 
80 | 	type: Literal['extract_page_content']
81 | 	goal: str
82 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/mcp/service.py:
--------------------------------------------------------------------------------
  1 | import json as _json
  2 | from inspect import Parameter, Signature
  3 | from pathlib import Path
  4 | from typing import Any
  5 | 
  6 | from fastmcp import FastMCP
  7 | from langchain_core.language_models.chat_models import BaseChatModel
  8 | 
  9 | from workflow_use.schema.views import WorkflowDefinitionSchema
 10 | from workflow_use.workflow.service import Workflow
 11 | 
 12 | 
 13 | def get_mcp_server(
 14 | 	llm_instance: BaseChatModel,
 15 | 	page_extraction_llm: BaseChatModel | None = None,
 16 | 	workflow_dir: str = './tmp',
 17 | 	name: str = 'WorkflowService',
 18 | 	description: str = 'Exposes workflows as MCP tools.',
 19 | ):
 20 | 	mcp_app = FastMCP(name=name, description=description)
 21 | 
 22 | 	_setup_workflow_tools(mcp_app, llm_instance, page_extraction_llm, workflow_dir)
 23 | 	return mcp_app
 24 | 
 25 | 
 26 | def _setup_workflow_tools(
 27 | 	mcp_app: FastMCP, llm_instance: BaseChatModel, page_extraction_llm: BaseChatModel | None, workflow_dir: str
 28 | ):
 29 | 	"""
 30 | 	Scans a directory for workflow.json files, loads them, and registers them as tools
 31 | 	with the FastMCP instance by dynamically setting function signatures.
 32 | 	"""
 33 | 	workflow_files = list(Path(workflow_dir).glob('*.workflow.json'))
 34 | 	print(f"[FastMCP Service] Found workflow files in '{workflow_dir}': {len(workflow_files)}")
 35 | 
 36 | 	for wf_file_path in workflow_files:
 37 | 		try:
 38 | 			print(f'[FastMCP Service] Loading workflow from: {wf_file_path}')
 39 | 			schema = WorkflowDefinitionSchema.load_from_json(str(wf_file_path))
 40 | 
 41 | 			# Instantiate the workflow
 42 | 			workflow = Workflow(
 43 | 				workflow_schema=schema, llm=llm_instance, page_extraction_llm=page_extraction_llm, browser=None, controller=None
 44 | 			)
 45 | 
 46 | 			params_for_signature = []
 47 | 			annotations_for_runner = {}
 48 | 
 49 | 			if hasattr(workflow._input_model, 'model_fields'):
 50 | 				for field_name, model_field in workflow._input_model.model_fields.items():
 51 | 					param_annotation = model_field.annotation if model_field.annotation is not None else Any
 52 | 
 53 | 					param_default = Parameter.empty
 54 | 					if not model_field.is_required():
 55 | 						param_default = model_field.default if model_field.default is not None else None
 56 | 
 57 | 					params_for_signature.append(
 58 | 						Parameter(
 59 | 							name=field_name,
 60 | 							kind=Parameter.POSITIONAL_OR_KEYWORD,
 61 | 							default=param_default,
 62 | 							annotation=param_annotation,
 63 | 						)
 64 | 					)
 65 | 					annotations_for_runner[field_name] = param_annotation
 66 | 
 67 | 			dynamic_signature = Signature(params_for_signature)
 68 | 
 69 | 			# Sanitize workflow name for the function name
 70 | 			safe_workflow_name_for_func = ''.join(c if c.isalnum() else '_' for c in schema.name)
 71 | 			dynamic_func_name = f'tool_runner_{safe_workflow_name_for_func}_{schema.version.replace(".", "_")}'
 72 | 
 73 | 			# Define the actual function that will be called by FastMCP
 74 | 			# It uses a closure to capture the specific 'workflow' instance
 75 | 			def create_runner(wf_instance: Workflow):
 76 | 				async def actual_workflow_runner(**kwargs):
 77 | 					# kwargs will be populated by FastMCP based on the dynamic_signature
 78 | 					raw_result = await wf_instance.run(inputs=kwargs)
 79 | 					try:
 80 | 						return _json.dumps(raw_result, default=str)
 81 | 					except Exception:
 82 | 						return str(raw_result)
 83 | 
 84 | 				return actual_workflow_runner
 85 | 
 86 | 			runner_func_impl = create_runner(workflow)
 87 | 
 88 | 			# Set the dunder attributes that FastMCP will inspect
 89 | 			runner_func_impl.__name__ = dynamic_func_name
 90 | 			runner_func_impl.__doc__ = schema.description
 91 | 			runner_func_impl.__signature__ = dynamic_signature
 92 | 			runner_func_impl.__annotations__ = annotations_for_runner
 93 | 
 94 | 			# Tool name and description for FastMCP registration
 95 | 			unique_tool_name = f'{schema.name.replace(" ", "_")}_{schema.version}'
 96 | 			tool_description = schema.description
 97 | 
 98 | 			tool_decorator = mcp_app.tool(name=unique_tool_name, description=tool_description)
 99 | 			tool_decorator(runner_func_impl)
100 | 
101 | 			param_names_for_log = list(dynamic_signature.parameters.keys())
102 | 			print(
103 | 				f"[FastMCP Service] Registered tool (via signature): '{unique_tool_name}' for '{schema.name}'. Params: {param_names_for_log}"
104 | 			)
105 | 
106 | 		except Exception as e:
107 | 			print(f'[FastMCP Service] Failed to load or register workflow from {wf_file_path}: {e}')
108 | 			import traceback
109 | 
110 | 			traceback.print_exc()
111 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/mcp/tests/test_tools.py:
--------------------------------------------------------------------------------
 1 | from langchain_openai import ChatOpenAI
 2 | 
 3 | from workflow_use.mcp.service import get_mcp_server
 4 | 
 5 | # async def main():
 6 | if __name__ == '__main__':
 7 | 	llm_instance = ChatOpenAI(model='gpt-4o', temperature=0)
 8 | 
 9 | 	print('[FastMCP Server] Starting MCP server...')
10 | 	# This will run the FastMCP server, typically using stdio transport by default.
11 | 	# For CLI execution like `fastmcp run workflow_use.mcp.server:mcp_app`,
12 | 	# this __main__ block might be bypassed by FastMCP's runner,
13 | 	# but it's good practice for direct Python execution.
14 | 	mcp = get_mcp_server(llm_instance, workflow_dir='./tmp')
15 | 	mcp.run(
16 | 		transport='sse',
17 | 		host='0.0.0.0',
18 | 		port=8008,
19 | 	)
20 | 
21 | 	# async with Client(mcp) as client:
22 | 	# 	tools = await client.list_tools()
23 | 	# 	print(f'Available tools: {tools}')
24 | 
25 | 	# 	result = await client.call_tool(
26 | 	# 		'Government_Form_Submission_1.0',
27 | 	# 		{
28 | 	# 			'first_name': 'John',
29 | 	# 			'last_name': 'Smith',
30 | 	# 			'social_security_last4': '1234',
31 | 	# 			'gender': 'male',
32 | 	# 			'marital_status': 'single',
33 | 	# 		},
34 | 	# 	)
35 | 
36 | 	# 	print(result)
37 | 
38 | 
39 | # if __name__ == '__main__':
40 | # 	asyncio.run(main())
41 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/recorder/recorder.py:
--------------------------------------------------------------------------------
 1 | # Example for your new main runner (e.g., in recorder.py or a new script)
 2 | import asyncio
 3 | 
 4 | from workflow_use.recorder.service import RecordingService  # Adjust import path if necessary
 5 | 
 6 | 
 7 | async def run_recording():
 8 | 	service = RecordingService()
 9 | 	print('Starting recording session via service...')
10 | 	workflow_schema = await service.capture_workflow()
11 | 
12 | 	if workflow_schema:
13 | 		print('\n--- MAIN SCRIPT: CAPTURED WORKFLOW ---')
14 | 		try:
15 | 			print(workflow_schema.model_dump_json(indent=2))
16 | 		except AttributeError:
17 | 			# Fallback if model_dump_json isn't available (e.g. if it's a dict)
18 | 			import json
19 | 
20 | 			print(json.dumps(workflow_schema, indent=2))  # Ensure schema is serializable
21 | 		print('------------------------------------')
22 | 	else:
23 | 		print('MAIN SCRIPT: No workflow was captured.')
24 | 
25 | 
26 | if __name__ == '__main__':
27 | 	try:
28 | 		asyncio.run(run_recording())
29 | 	except KeyboardInterrupt:
30 | 		print('Main recording script interrupted.')
31 | 	except Exception as e:
32 | 		print(f'An error occurred in the main recording script: {e}')
33 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/recorder/service.py:
--------------------------------------------------------------------------------
  1 | import asyncio
  2 | import json
  3 | import pathlib
  4 | from typing import Optional
  5 | 
  6 | import uvicorn
  7 | from browser_use import Browser
  8 | from browser_use.browser.profile import BrowserProfile
  9 | from fastapi import FastAPI
 10 | from patchright.async_api import async_playwright as patchright_async_playwright
 11 | 
 12 | # Assuming views.py is correctly located for this import path
 13 | from workflow_use.recorder.views import (
 14 | 	HttpRecordingStoppedEvent,
 15 | 	HttpWorkflowUpdateEvent,
 16 | 	RecorderEvent,
 17 | 	WorkflowDefinitionSchema,  # This is the expected output type
 18 | )
 19 | 
 20 | # Path Configuration (should be identical to recorder.py if run from the same context)
 21 | SCRIPT_DIR = pathlib.Path(__file__).resolve().parent
 22 | EXT_DIR = SCRIPT_DIR.parent.parent.parent / 'extension' / '.output' / 'chrome-mv3'
 23 | USER_DATA_DIR = SCRIPT_DIR / 'user_data_dir'
 24 | 
 25 | 
 26 | class RecordingService:
 27 | 	def __init__(self):
 28 | 		self.event_queue: asyncio.Queue[RecorderEvent] = asyncio.Queue()
 29 | 		self.last_workflow_update_event: Optional[HttpWorkflowUpdateEvent] = None
 30 | 		self.browser: Browser
 31 | 
 32 | 		self.final_workflow_output: Optional[WorkflowDefinitionSchema] = None
 33 | 		self.recording_complete_event = asyncio.Event()
 34 | 		self.final_workflow_processed_lock = asyncio.Lock()
 35 | 		self.final_workflow_processed_flag = False
 36 | 
 37 | 		self.app = FastAPI(title='Temporary Recording Event Server')
 38 | 		self.app.add_api_route('/event', self._handle_event_post, methods=['POST'], status_code=202)
 39 | 		# -- DEBUGGING --
 40 | 		# Turn this on to debug requests
 41 | 		# @self.app.middleware("http")
 42 | 		# async def log_requests(request: Request, call_next):
 43 | 		#     print(f"[Debug] Incoming request: {request.method} {request.url}")
 44 | 		#     try:
 45 | 		#         # Read request body
 46 | 		#         body = await request.body()
 47 | 		#         print(f"[Debug] Request body: {body.decode('utf-8', errors='replace')}")
 48 | 		#         response = await call_next(request)
 49 | 		#         print(f"[Debug] Response status: {response.status_code}")
 50 | 		#         return response
 51 | 		#     except Exception as e:
 52 | 		#         print(f"[Error] Error processing request: {str(e)}")
 53 | 
 54 | 		self.uvicorn_server_instance: Optional[uvicorn.Server] = None
 55 | 		self.server_task: Optional[asyncio.Task] = None
 56 | 		self.browser_task: Optional[asyncio.Task] = None
 57 | 		self.event_processor_task: Optional[asyncio.Task] = None
 58 | 
 59 | 	async def _handle_event_post(self, event_data: RecorderEvent):
 60 | 		if isinstance(event_data, HttpWorkflowUpdateEvent):
 61 | 			self.last_workflow_update_event = event_data
 62 | 		await self.event_queue.put(event_data)
 63 | 		return {'status': 'accepted', 'message': 'Event queued for processing'}
 64 | 
 65 | 	async def _process_event_queue(self):
 66 | 		print('[Service] Event processing task started.')
 67 | 		try:
 68 | 			while True:
 69 | 				event = await self.event_queue.get()
 70 | 				print(f'[Service] Event Received: {event.type}')
 71 | 				if isinstance(event, HttpWorkflowUpdateEvent):
 72 | 					# self.last_workflow_update_event is already updated in _handle_event_post
 73 | 					pass
 74 | 				elif isinstance(event, HttpRecordingStoppedEvent):
 75 | 					print('[Service] RecordingStoppedEvent received, processing final workflow...')
 76 | 					await self._capture_and_signal_final_workflow('RecordingStoppedEvent')
 77 | 				self.event_queue.task_done()
 78 | 		except asyncio.CancelledError:
 79 | 			print('[Service] Event processing task cancelled.')
 80 | 		except Exception as e:
 81 | 			print(f'[Service] Error in event processing task: {e}')
 82 | 
 83 | 	async def _capture_and_signal_final_workflow(self, trigger_reason: str):
 84 | 		processed_this_call = False
 85 | 		async with self.final_workflow_processed_lock:
 86 | 			if not self.final_workflow_processed_flag and self.last_workflow_update_event:
 87 | 				print(f'[Service] Capturing final workflow (Trigger: {trigger_reason}).')
 88 | 				self.final_workflow_output = self.last_workflow_update_event.payload
 89 | 				self.final_workflow_processed_flag = True
 90 | 				processed_this_call = True
 91 | 
 92 | 		if processed_this_call:
 93 | 			print('[Service] Final workflow captured. Setting recording_complete_event.')
 94 | 			self.recording_complete_event.set()  # Signal completion to the main method
 95 | 
 96 | 			# If processing was due to RecordingStoppedEvent, also try to close the browser
 97 | 			if trigger_reason == 'RecordingStoppedEvent' and self.browser:
 98 | 				print('[Service] Attempting to close browser due to RecordingStoppedEvent...')
 99 | 				try:
100 | 					await self.browser.close()
101 | 					print('[Service] Browser close command issued.')
102 | 				except Exception as e_close:
103 | 					print(f'[Service] Error closing browser on recording stop: {e_close}')
104 | 
105 | 	async def _launch_browser_and_wait(self):
106 | 		print(f'[Service] Attempting to load extension from: {EXT_DIR}')
107 | 		if not EXT_DIR.exists() or not EXT_DIR.is_dir():
108 | 			print(f'[Service] ERROR: Extension directory not found: {EXT_DIR}')
109 | 			self.recording_complete_event.set()  # Signal failure
110 | 			return
111 | 
112 | 		# Ensure user data dir exists
113 | 		USER_DATA_DIR.mkdir(parents=True, exist_ok=True)
114 | 		print(f'[Service] Using browser user data directory: {USER_DATA_DIR}')
115 | 
116 | 		try:
117 | 			# Create browser profile with extension support
118 | 			profile = BrowserProfile(
119 | 				headless=False,
120 | 				user_data_dir=str(USER_DATA_DIR.resolve()),
121 | 				args=[
122 | 					f'--disable-extensions-except={str(EXT_DIR.resolve())}',
123 | 					f'--load-extension={str(EXT_DIR.resolve())}',
124 | 					'--no-default-browser-check',
125 | 					'--no-first-run',
126 | 				],
127 | 				keep_alive=True,
128 | 			)
129 | 
130 | 			# Create and configure browser
131 | 			playwright = await patchright_async_playwright().start()
132 | 			self.browser = Browser(browser_profile=profile, playwright=playwright)
133 | 
134 | 			print('[Service] Starting browser with extensions...')
135 | 			await self.browser.start()
136 | 
137 | 			print('[Service] Browser launched. Waiting for close or recording stop...')
138 | 
139 | 			# Wait for browser to be closed manually or recording to stop
140 | 			# We'll implement a simple polling mechanism to check if browser is still running
141 | 			while True:
142 | 				try:
143 | 					# Check if browser is still running by trying to get current page
144 | 					await self.browser.get_current_page()
145 | 					await asyncio.sleep(1)  # Poll every second
146 | 				except Exception:
147 | 					# Browser is likely closed
148 | 					print('[Service] Browser appears to be closed or inaccessible.')
149 | 					break
150 | 
151 | 		except asyncio.CancelledError:
152 | 			print('[Service] Browser task cancelled.')
153 | 			if self.browser:
154 | 				try:
155 | 					await self.browser.close()
156 | 				except:
157 | 					pass  # Best effort
158 | 			raise  # Re-raise to be caught by gather
159 | 		except Exception as e:
160 | 			print(f'[Service] Error in browser task: {e}')
161 | 		finally:
162 | 			print('[Service] Browser task finalization.')
163 | 			# self.browser = None
164 | 			# This call ensures that if browser is closed manually, we still try to capture.
165 | 			await self._capture_and_signal_final_workflow('BrowserTaskEnded')
166 | 
167 | 	async def capture_workflow(self) -> Optional[WorkflowDefinitionSchema]:
168 | 		print('[Service] Starting capture_workflow session...')
169 | 		# Reset state for this session
170 | 		self.last_workflow_update_event = None
171 | 		self.final_workflow_output = None
172 | 		self.recording_complete_event.clear()
173 | 		self.final_workflow_processed_flag = False
174 | 
175 | 		# Start background tasks
176 | 		self.event_processor_task = asyncio.create_task(self._process_event_queue())
177 | 		self.browser_task = asyncio.create_task(self._launch_browser_and_wait())
178 | 
179 | 		# Configure and start Uvicorn server
180 | 		config = uvicorn.Config(self.app, host='127.0.0.1', port=7331, log_level='warning', loop='asyncio')
181 | 		self.uvicorn_server_instance = uvicorn.Server(config)
182 | 		self.server_task = asyncio.create_task(self.uvicorn_server_instance.serve())
183 | 		print('[Service] Uvicorn server task started.')
184 | 
185 | 		try:
186 | 			print('[Service] Waiting for recording to complete...')
187 | 			await self.recording_complete_event.wait()
188 | 			print('[Service] Recording complete event received. Proceeding to cleanup.')
189 | 		except asyncio.CancelledError:
190 | 			print('[Service] capture_workflow task was cancelled externally.')
191 | 		finally:
192 | 			print('[Service] Starting cleanup phase...')
193 | 
194 | 			# 1. Stop Uvicorn server
195 | 			if self.uvicorn_server_instance and self.server_task and not self.server_task.done():
196 | 				print('[Service] Signaling Uvicorn server to shut down...')
197 | 				self.uvicorn_server_instance.should_exit = True
198 | 				try:
199 | 					await asyncio.wait_for(self.server_task, timeout=5)  # Give server time to shut down
200 | 				except asyncio.TimeoutError:
201 | 					print('[Service] Uvicorn server shutdown timed out. Cancelling task.')
202 | 					self.server_task.cancel()
203 | 				except asyncio.CancelledError:  # If capture_workflow itself was cancelled
204 | 					pass
205 | 				except Exception as e_server_shutdown:
206 | 					print(f'[Service] Error during Uvicorn server shutdown: {e_server_shutdown}')
207 | 
208 | 			# 2. Stop browser task (and ensure browser is closed)
209 | 			if self.browser_task and not self.browser_task.done():
210 | 				print('[Service] Cancelling browser task...')
211 | 				self.browser_task.cancel()
212 | 				try:
213 | 					await self.browser_task
214 | 				except asyncio.CancelledError:
215 | 					pass
216 | 				except Exception as e_browser_cancel:
217 | 					print(f'[Service] Error awaiting cancelled browser task: {e_browser_cancel}')
218 | 
219 | 			if self.browser:  # Final check to close browser if still open
220 | 				print('[Service] Ensuring browser is closed in cleanup...')
221 | 				try:
222 | 					self.browser.browser_profile.keep_alive = False
223 | 					await self.browser.close()
224 | 				except Exception as e_browser_close:
225 | 					print(f'[Service] Error closing browser in final cleanup: {e_browser_close}')
226 | 				# self.browser = None
227 | 
228 | 			# 3. Stop event processor task
229 | 			if self.event_processor_task and not self.event_processor_task.done():
230 | 				print('[Service] Cancelling event processor task...')
231 | 				self.event_processor_task.cancel()
232 | 				try:
233 | 					await self.event_processor_task
234 | 				except asyncio.CancelledError:
235 | 					pass
236 | 				except Exception as e_ep_cancel:
237 | 					print(f'[Service] Error awaiting cancelled event processor task: {e_ep_cancel}')
238 | 
239 | 			print('[Service] Cleanup phase complete.')
240 | 
241 | 		if self.final_workflow_output:
242 | 			print('[Service] Returning captured workflow.')
243 | 		else:
244 | 			print('[Service] No workflow captured or an error occurred.')
245 | 		return self.final_workflow_output
246 | 
247 | 
248 | async def main_service_runner():  # Example of how to run the service
249 | 	service = RecordingService()
250 | 	workflow_data = await service.capture_workflow()
251 | 	if workflow_data:
252 | 		print('\n--- CAPTURED WORKFLOW DATA (from main_service_runner) ---')
253 | 		# Assuming WorkflowDefinitionSchema has model_dump_json or similar
254 | 		try:
255 | 			print(workflow_data.model_dump_json(indent=2))
256 | 		except AttributeError:
257 | 			print(json.dumps(workflow_data, indent=2))  # Fallback for plain dicts if model_dump_json not present
258 | 		print('-----------------------------------------------------')
259 | 	else:
260 | 		print('No workflow data was captured by the service.')
261 | 
262 | 
263 | if __name__ == '__main__':
264 | 	# This allows running service.py directly for testing
265 | 	try:
266 | 		asyncio.run(main_service_runner())
267 | 	except KeyboardInterrupt:
268 | 		print('Service runner interrupted by user.')
269 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/recorder/views.py:
--------------------------------------------------------------------------------
 1 | from typing import Literal, Union
 2 | 
 3 | from pydantic import BaseModel
 4 | 
 5 | from workflow_use.schema.views import WorkflowDefinitionSchema
 6 | 
 7 | # --- Event Payloads ---
 8 | 
 9 | 
10 | class RecordingStatusPayload(BaseModel):
11 | 	message: str
12 | 
13 | 
14 | # --- Main Event Models (mirroring HttpEvent types from message-bus-types.ts) ---
15 | 
16 | 
17 | class BaseHttpEvent(BaseModel):
18 | 	timestamp: int
19 | 
20 | 
21 | class HttpWorkflowUpdateEvent(BaseHttpEvent):
22 | 	type: Literal['WORKFLOW_UPDATE'] = 'WORKFLOW_UPDATE'
23 | 	payload: WorkflowDefinitionSchema
24 | 
25 | 
26 | class HttpRecordingStartedEvent(BaseHttpEvent):
27 | 	type: Literal['RECORDING_STARTED'] = 'RECORDING_STARTED'
28 | 	payload: RecordingStatusPayload
29 | 
30 | 
31 | class HttpRecordingStoppedEvent(BaseHttpEvent):
32 | 	type: Literal['RECORDING_STOPPED'] = 'RECORDING_STOPPED'
33 | 	payload: RecordingStatusPayload
34 | 
35 | 
36 | # Union of all possible event types received by the recorder
37 | RecorderEvent = Union[
38 | 	HttpWorkflowUpdateEvent,
39 | 	HttpRecordingStartedEvent,
40 | 	HttpRecordingStoppedEvent,
41 | ]
42 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/schema/views.py:
--------------------------------------------------------------------------------
  1 | from typing import List, Literal, Optional, Union
  2 | 
  3 | from pydantic import BaseModel, Field
  4 | 
  5 | 
  6 | # --- Base Step Model ---
  7 | # Common fields for all step types
  8 | class BaseWorkflowStep(BaseModel):
  9 | 	description: Optional[str] = Field(None, description="Optional description/comment about the step's purpose.")
 10 | 	output: Optional[str] = Field(None, description='Context key to store step output under.')
 11 | 	# Allow other fields captured from raw events but not explicitly modeled
 12 | 	model_config = {'extra': 'allow'}
 13 | 
 14 | 
 15 | # --- Timestamped Step Mixin (for deterministic actions) ---
 16 | class TimestampedWorkflowStep(BaseWorkflowStep):
 17 | 	timestamp: Optional[int] = Field(None, description='Timestamp from recording (informational).')
 18 | 	tabId: Optional[int] = Field(None, description='Browser tab ID from recording (informational).')
 19 | 
 20 | 
 21 | # --- Agent Step ---
 22 | class AgentTaskWorkflowStep(BaseWorkflowStep):
 23 | 	type: Literal['agent']
 24 | 	task: str = Field(..., description='The objective or task description for the agent.')
 25 | 	max_steps: Optional[int] = Field(
 26 | 		None,
 27 | 		description='Maximum number of iterations for the agent (default handled in code).',
 28 | 	)
 29 | 	# Agent steps might also have 'params' for other configs, handled by extra='allow'
 30 | 
 31 | 
 32 | # --- Deterministic Action Steps (based on controllers and examples) ---
 33 | 
 34 | 
 35 | # Actions from src/workflows/controller/service.py & Examples
 36 | class NavigationStep(TimestampedWorkflowStep):
 37 | 	"""Navigates using the 'navigation' action (likely maps to go_to_url)."""
 38 | 
 39 | 	type: Literal['navigation']  # As seen in examples
 40 | 	url: str = Field(..., description='Target URL to navigate to. Can use {context_var}.')
 41 | 
 42 | 
 43 | class ClickStep(TimestampedWorkflowStep):
 44 | 	"""Clicks an element using 'click' (maps to workflow controller's click)."""
 45 | 
 46 | 	type: Literal['click']  # As seen in examples
 47 | 	cssSelector: str = Field(..., description='CSS selector for the target element.')
 48 | 	xpath: Optional[str] = Field(None, description='XPath selector (often informational).')
 49 | 	elementTag: Optional[str] = Field(None, description='HTML tag (informational).')
 50 | 	elementText: Optional[str] = Field(None, description='Element text (informational).')
 51 | 
 52 | 
 53 | class InputStep(TimestampedWorkflowStep):
 54 | 	"""Inputs text using 'input' (maps to workflow controller's input)."""
 55 | 
 56 | 	type: Literal['input']  # As seen in examples
 57 | 	cssSelector: str = Field(..., description='CSS selector for the target input element.')
 58 | 	value: str = Field(..., description='Value to input. Can use {context_var}.')
 59 | 	xpath: Optional[str] = Field(None, description='XPath selector (informational).')
 60 | 	elementTag: Optional[str] = Field(None, description='HTML tag (informational).')
 61 | 
 62 | 
 63 | class SelectChangeStep(TimestampedWorkflowStep):
 64 | 	"""Selects a dropdown option using 'select_change' (maps to workflow controller's select_change)."""
 65 | 
 66 | 	type: Literal['select_change']  # Assumed type for workflow controller's select_change
 67 | 	cssSelector: str = Field(..., description='CSS selector for the target select element.')
 68 | 	selectedText: str = Field(..., description='Visible text of the option to select. Can use {context_var}.')
 69 | 	xpath: Optional[str] = Field(None, description='XPath selector (informational).')
 70 | 	elementTag: Optional[str] = Field(None, description='HTML tag (informational).')
 71 | 
 72 | 
 73 | class KeyPressStep(TimestampedWorkflowStep):
 74 | 	"""Presses a key using 'key_press' (maps to workflow controller's key_press)."""
 75 | 
 76 | 	type: Literal['key_press']  # As seen in examples
 77 | 	cssSelector: str = Field(..., description='CSS selector for the target element.')
 78 | 	key: str = Field(..., description="The key to press (e.g., 'Tab', 'Enter').")
 79 | 	xpath: Optional[str] = Field(None, description='XPath selector (informational).')
 80 | 	elementTag: Optional[str] = Field(None, description='HTML tag (informational).')
 81 | 
 82 | 
 83 | class ScrollStep(TimestampedWorkflowStep):
 84 | 	"""Scrolls the page using 'scroll' (maps to workflow controller's scroll)."""
 85 | 
 86 | 	type: Literal['scroll']  # Assumed type for workflow controller's scroll
 87 | 	scrollX: int = Field(..., description='Horizontal scroll pixels.')
 88 | 	scrollY: int = Field(..., description='Vertical scroll pixels.')
 89 | 
 90 | 
 91 | class PageExtractionStep(TimestampedWorkflowStep):
 92 | 	"""Extracts text from the page using 'page_extraction' (maps to workflow controller's page_extraction)."""
 93 | 
 94 | 	type: Literal['extract_page_content']  # Assumed type for workflow controller's page_extraction
 95 | 	goal: str = Field(..., description='The goal of the page extraction.')
 96 | 
 97 | 
 98 | # --- Union of all possible step types ---
 99 | # This Union defines what constitutes a valid step in the "steps" list.
100 | DeterministicWorkflowStep = Union[
101 | 	NavigationStep,
102 | 	ClickStep,
103 | 	InputStep,
104 | 	SelectChangeStep,
105 | 	KeyPressStep,
106 | 	ScrollStep,
107 | 	PageExtractionStep,
108 | ]
109 | 
110 | AgenticWorkflowStep = AgentTaskWorkflowStep
111 | 
112 | 
113 | WorkflowStep = Union[
114 | 	# Pure workflow
115 | 	DeterministicWorkflowStep,
116 | 	# Agentic
117 | 	AgenticWorkflowStep,
118 | ]
119 | 
120 | allowed_controller_actions = []
121 | 
122 | 
123 | # --- Input Schema Definition ---
124 | # (Remains the same)
125 | class WorkflowInputSchemaDefinition(BaseModel):
126 | 	name: str = Field(
127 | 		...,
128 | 		description='The name of the property. This will be used as the key in the input schema.',
129 | 	)
130 | 	type: Literal['string', 'number', 'bool']
131 | 	required: Optional[bool] = Field(
132 | 		default=None,
133 | 		description='None if the property is optional, True if the property is required.',
134 | 	)
135 | 
136 | 
137 | # --- Top-Level Workflow Definition File ---
138 | # Uses the Union WorkflowStep type
139 | 
140 | 
141 | class WorkflowDefinitionSchema(BaseModel):
142 | 	"""Pydantic model representing the structure of the workflow JSON file."""
143 | 
144 | 	workflow_analysis: Optional[str] = Field(
145 | 		None,
146 | 		description='A chain of thought reasoning analysis of the original workflow recording.',
147 | 	)
148 | 
149 | 	name: str = Field(..., description='The name of the workflow.')
150 | 	description: str = Field(..., description='A human-readable description of the workflow.')
151 | 	version: str = Field(..., description='The version identifier for this workflow definition.')
152 | 	steps: List[WorkflowStep] = Field(
153 | 		...,
154 | 		min_length=1,
155 | 		description='An ordered list of steps (actions or agent tasks) to be executed.',
156 | 	)
157 | 	input_schema: list[WorkflowInputSchemaDefinition] = Field(
158 | 		# default=WorkflowInputSchemaDefinition(),
159 | 		description='List of input schema definitions.',
160 | 	)
161 | 
162 | 	# Add loader from json file
163 | 	@classmethod
164 | 	def load_from_json(cls, json_path: str):
165 | 		with open(json_path, 'r') as f:
166 | 			return cls.model_validate_json(f.read())
167 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/workflow/prompts.py:
--------------------------------------------------------------------------------
 1 | WORKFLOW_FALLBACK_PROMPT_TEMPLATE = (
 2 | 	'While executing step {step_index}/{total_steps} in the workflow:\n\n'
 3 | 	# "{workflow_details}\n\n"
 4 | 	"The deterministic action '{action_type}' failed with the following context:\n"
 5 | 	'{fail_details}\n\n'
 6 | 	'The intended target or expected value for this step was: {failed_value}\n\n'
 7 | 	'IMPORTANT: Your task is to ONLY complete this specific step ({step_index}) and nothing more. '
 8 | 	"The step's purpose is described as: '{step_description}'.\n"
 9 | 	'Do not retry the same action that failed. Instead, choose a different suitable action(s) to accomplish the same goal. '
10 | 	'For example, if a click failed, consider navigating to a URL, inputting text, or selecting an option. '
11 | 	'However, ONLY perform the minimum action needed to complete this specific step. '
12 | 	'If the step requires clicking a button, ONLY click that button. If it requires navigation, ONLY navigate. '
13 | 	'Do not perform any additional actions beyond what is strictly necessary for this step. '
14 | 	'Once the objective of step {step_index} is reached, call the Done action to complete the step. '
15 | 	'Do not proceed to the next step or perform any actions beyond this specific step.'
16 | )
17 | 
18 | STRUCTURED_OUTPUT_PROMPT = """
19 | You are a data extraction expert. Your task is to extract structured information from the provided content.
20 | 
21 | The content may contain various pieces of information from different sources. You need to analyze this content and extract the relevant information according to the output schema provided below.
22 | 
23 | Only extract information that is explicitly present in the content. Be precise and follow the schema exactly.
24 | """
25 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/workflow/tests/run_workflow.py:
--------------------------------------------------------------------------------
 1 | import asyncio
 2 | from pathlib import Path
 3 | 
 4 | # Ensure langchain-openai is installed and OPENAI_API_KEY is set
 5 | from langchain_openai import ChatOpenAI
 6 | 
 7 | from workflow_use.builder.service import BuilderService
 8 | from workflow_use.workflow.service import Workflow
 9 | 
10 | # Instantiate the LLM and the service directly
11 | llm_instance = ChatOpenAI(model='gpt-4o')  # Or your preferred model
12 | builder_service = BuilderService(llm=llm_instance)
13 | 
14 | 
15 | async def test_run_workflow():
16 | 	"""
17 | 	Tests that the workflow is built correctly from a JSON file path.
18 | 	"""
19 | 	path = Path(__file__).parent / 'tmp' / 'recording.workflow.json'
20 | 
21 | 	workflow = Workflow.load_from_file(path)
22 | 	result = await workflow.run({'model': '12'})
23 | 	print(result)
24 | 
25 | 
26 | if __name__ == '__main__':
27 | 	asyncio.run(test_run_workflow())
28 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/workflow/tests/test_extract.py:
--------------------------------------------------------------------------------
 1 | import asyncio
 2 | from pathlib import Path
 3 | 
 4 | # Ensure langchain-openai is installed and OPENAI_API_KEY is set
 5 | from langchain_openai import ChatOpenAI
 6 | from pydantic import BaseModel
 7 | 
 8 | from workflow_use.workflow.service import Workflow
 9 | 
10 | # Instantiate the LLM and the service directly
11 | llm_instance = ChatOpenAI(model='gpt-4o')  # Or your preferred model
12 | page_extraction_llm = ChatOpenAI(model='gpt-4o-mini')
13 | 
14 | 
15 | class OutputModel(BaseModel):
16 | 	api_key: str
17 | 
18 | 
19 | async def test_run_workflow():
20 | 	"""
21 | 	Tests that the workflow is built correctly from a JSON file path.
22 | 	"""
23 | 	path = Path(__file__).parent / 'tmp' / 'extract.workflow.json'
24 | 
25 | 	workflow = Workflow.load_from_file(path, llm=llm_instance, page_extraction_llm=page_extraction_llm)
26 | 
27 | 	result = await workflow.run({'api_key_name': 'test key'}, output_model=OutputModel)
28 | 
29 | 	assert result.output_model is not None
30 | 
31 | 	print(result.output_model.api_key)
32 | 
33 | 
34 | if __name__ == '__main__':
35 | 	asyncio.run(test_run_workflow())
36 | 


--------------------------------------------------------------------------------
/workflows/workflow_use/workflow/views.py:
--------------------------------------------------------------------------------
 1 | from typing import Any, Dict, Generic, List, Optional, TypeVar
 2 | 
 3 | from browser_use.agent.views import ActionResult, AgentHistoryList
 4 | from pydantic import BaseModel, Field
 5 | 
 6 | T = TypeVar('T', bound=BaseModel)
 7 | 
 8 | 
 9 | class WorkflowRunOutput(BaseModel, Generic[T]):
10 | 	"""Output of a workflow run"""
11 | 
12 | 	step_results: List[ActionResult | AgentHistoryList]
13 | 	output_model: Optional[T] = None
14 | 
15 | 
16 | class StructuredWorkflowOutput(BaseModel):
17 | 	"""Base model for structured workflow outputs.
18 | 
19 | 	This can be used as a parent class for custom output models that
20 | 	will be filled by convert_results_to_output_model method.
21 | 	"""
22 | 
23 | 	raw_data: Dict[str, Any] = Field(default_factory=dict, description='Raw extracted data from workflow execution')
24 | 
25 | 	status: str = Field(default='success', description='Overall status of the workflow execution')
26 | 
27 | 	error_message: Optional[str] = Field(default=None, description='Error message if the workflow failed')
28 | 


--------------------------------------------------------------------------------