Hello, Rayrun!

10 | Some text here 11 | 12 |

Deep Nesting Test Page

9 |

10 |

11 |

12 | 13 |

14 |

15 |

16 |

All Attributes Test Page

14 | 15 | Some span 16 |

; 6 | 7 | export type StepOptions = { 8 | debug?: boolean; 9 | model?: string; 10 | openaiApiKey?: string; 11 | openaiBaseUrl?: string; 12 | openaiDefaultQuery?: {}; 13 | openaiDefaultHeaders?: {}; 14 | }; 15 | 16 | export type TaskMessage = { 17 | task: string; 18 | snapshot: { 19 | dom: string; 20 | }; 21 | options?: StepOptions; 22 | }; 23 | 24 | export type TaskResult = { 25 | assertion?: boolean; 26 | query?: string; 27 | errorMessage?: string; 28 | }; 29 | -------------------------------------------------------------------------------- /.github/workflows/release.yaml: -------------------------------------------------------------------------------- 1 | jobs: 2 | release: 3 | runs-on: ubuntu-latest 4 | environment: release 5 | name: Release 6 | steps: 7 | - name: setup repository 8 | uses: actions/checkout@v3 9 | with: 10 | fetch-depth: 0 11 | - name: setup node.js 12 | uses: actions/setup-node@v3 13 | with: 14 | node-version: "21" 15 | - run: npm ci 16 | - run: npm run lint 17 | - run: npm run build 18 | - run: npx semantic-release 19 | env: 20 | GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} 21 | NPM_TOKEN: ${{ secrets.NPM_TOKEN }} 22 | name: release 23 | on: 24 | push: 25 | branches: 26 | - main 27 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2023 Luc Gagan (https://ray.run/) 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall 
be included in all 13 | copies or substantial portions of the Software. 14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. -------------------------------------------------------------------------------- /package.json: -------------------------------------------------------------------------------- 1 | { 2 | "dependencies": { 3 | "@hono/node-server": "1.14.1", 4 | "hono": "4.7.7", 5 | "openai": "4.96.0", 6 | "playwright": "1.52.0", 7 | "sanitize-html": "2.16.0", 8 | "zod": "3.24.3" 9 | }, 10 | "author": { 11 | "name": "Luc Gagan", 12 | "email": "luc@ray.run", 13 | "url": "https://ray.run" 14 | }, 15 | "license": "MIT", 16 | "files": [ 17 | "dist" 18 | ], 19 | "homepage": "https://ray.run", 20 | "keywords": [ 21 | "openai", 22 | "playwright", 23 | "test" 24 | ], 25 | "peerDependencies": { 26 | "@playwright/test": "^1.39.0" 27 | }, 28 | "release": { 29 | "branches": [ 30 | "main" 31 | ] 32 | }, 33 | "name": "auto-playwright", 34 | "main": "./dist/index.js", 35 | "types": "./dist/index.d.ts", 36 | "exports": { 37 | ".": { 38 | "types": "./dist/index.d.ts", 39 | "default": "./dist/index.js" 40 | } 41 | }, 42 | "sideEffects": false, 43 | "description": "Automate Playwright tests using ChatGPT.", 44 | "repository": { 45 | "type": "git", 46 | "url": "https://github.com/lucgagan/auto-playwright" 47 | }, 48 | "devDependencies": { 49 | "@playwright/test": "1.52.0", 50 | "@types/node": "20.17.30", 51 | "@types/sanitize-html": "2.15.0", 52 | "knip": "5.50.5", 53 | "prettier": "3.5.3", 54 | "semantic-release": "24.2.3", 55 | "tsx": 
"4.19.3", 56 | "typescript": "5.8.3" 57 | }, 58 | "scripts": { 59 | "start": "tsx ./tests/bin/startServer.ts", 60 | "build": "tsc --project tsconfig.build.json", 61 | "format": "prettier --write ./src", 62 | "lint": "prettier --check ./src && knip", 63 | "semantic-release": "semantic-release", 64 | "test": "playwright test" 65 | }, 66 | "version": "0.0.0-development" 67 | } 68 | -------------------------------------------------------------------------------- /src/auto.ts: -------------------------------------------------------------------------------- 1 | import { MAX_TASK_CHARS } from "./config"; 2 | import { type Page, type Test, StepOptions } from "./types"; 3 | import { completeTask } from "./completeTask"; 4 | import { UnimplementedError } from "./errors"; 5 | import { getSnapshot } from "./getSnapshot"; 6 | 7 | export const auto = async ( 8 | task: string, 9 | config: { page: Page; test?: Test }, 10 | options?: StepOptions, 11 | ): Promise => { 12 | if (!config || !config.page) { 13 | throw Error( 14 | "The auto() function is missing the required `{ page }` argument.", 15 | ); 16 | } 17 | 18 | const { test, page } = config as { page: Page; test?: Test }; 19 | 20 | if (!test) { 21 | return await runTask(task, page, options); 22 | } 23 | 24 | return test.step(`auto-playwright.ai '${task}'`, async () => { 25 | const result = await runTask(task, page, options); 26 | 27 | if (result.errorMessage) { 28 | throw new UnimplementedError(result.errorMessage); 29 | } 30 | 31 | if (result.assertion !== undefined) { 32 | return result.assertion; 33 | } 34 | 35 | if (result.query !== undefined) { 36 | return result.query; 37 | } 38 | 39 | return undefined; 40 | }); 41 | }; 42 | 43 | async function runTask( 44 | task: string, 45 | page: Page, 46 | options: StepOptions | undefined, 47 | ) { 48 | if (task.length > MAX_TASK_CHARS) { 49 | throw new Error( 50 | `Provided task string is too long, max length is ${MAX_TASK_CHARS} chars.`, 51 | ); 52 | } 53 | 54 | const result = 
await completeTask(page, { 55 | task, 56 | snapshot: await getSnapshot(page), 57 | options: options 58 | ? { 59 | model: options.model ?? "gpt-4o", 60 | debug: options.debug ?? false, 61 | openaiApiKey: options.openaiApiKey, 62 | openaiBaseUrl: options.openaiBaseUrl, 63 | openaiDefaultQuery: options.openaiDefaultQuery, 64 | openaiDefaultHeaders: options.openaiDefaultHeaders, 65 | } 66 | : undefined, 67 | }); 68 | return result; 69 | } 70 | -------------------------------------------------------------------------------- /src/sanitizeHtml.ts: -------------------------------------------------------------------------------- 1 | import sanitizeHtmlLibrary = require("sanitize-html"); 2 | 3 | type SanitizeStylesType = 4 | | { [index: string]: { [index: string]: RegExp[] } } 5 | | undefined; 6 | 7 | type SanitizeClassListType = 8 | | { [index: string]: boolean | Array } 9 | | undefined; 10 | 11 | const DEFAULT_SANITIZE_TAGS = sanitizeHtmlLibrary.defaults.allowedTags.concat([ 12 | "body", 13 | "button", 14 | "form", 15 | "img", 16 | "input", 17 | "select", 18 | "textarea", 19 | "option", 20 | ]); 21 | 22 | const DEFAULT_SANITIZE_STYLES: SanitizeStylesType = undefined; 23 | 24 | const DEFAULT_SANITIZE_CLASS_LIST: SanitizeClassListType = undefined; 25 | 26 | export function getSanitizeOptions(): sanitizeHtmlLibrary.IOptions { 27 | return { 28 | // The default allowedTags list already includes _a lot_ of commonly used tags. 29 | // https://www.npmjs.com/package/sanitize-html#default-options 30 | // 31 | // I don't see a need for this to be configurable at the moment, 32 | // as it already covers all the layout tags, but we can revisit this if necessary. 33 | allowedTags: DEFAULT_SANITIZE_TAGS, 34 | // Setting allowedAttributes to false will allow all attributes. 
35 | allowedAttributes: false, 36 | allowedClasses: DEFAULT_SANITIZE_CLASS_LIST, 37 | allowedStyles: DEFAULT_SANITIZE_STYLES, 38 | }; 39 | } 40 | 41 | /** 42 | * The reason for sanitization is because OpenAI does not need all of the HTML tags 43 | * to know how to interpret the website, e.g. it will not make a difference to AI if 44 | * we include or exclude 44 | 45 |

46 | Choose a fruit: 47 | 54 |

Selected fruit: None

55 | 62 |

63 |

64 | Choose colors: 65 | 71 |

Selected colors: None

72 | 80 |

81 | 84 | 85 | 93 | 94 |

95 | 96 |

97 | You have reached the bottom of the page! 98 |

99 | 100 | `), 101 | ); 102 | 103 | return new Promise((resolve) => { 104 | const server = serve( 105 | { 106 | fetch: app.fetch, 107 | port, 108 | }, 109 | (info) => { 110 | resolve({ 111 | close: () => { 112 | server.close(); 113 | }, 114 | port: info.port, 115 | }); 116 | }, 117 | ); 118 | }); 119 | }; 120 | 121 | startServer(3000); 122 | -------------------------------------------------------------------------------- /tests/auto.spec.ts: -------------------------------------------------------------------------------- 1 | import { expect, test } from "@playwright/test"; 2 | import { auto } from "../src/auto"; 3 | 4 | const options = undefined; 5 | 6 | test("executes query", async ({ page }) => { 7 | await page.goto("/"); 8 | 9 | const headerText = await auto("get the header text", { page, test }, options); 10 | 11 | expect(headerText).toBe("Hello, Rayrun!"); 12 | }); 13 | 14 | test("executes query using locator_evaluate", async ({ page }) => { 15 | await page.goto("/"); 16 | 17 | const headerText = await auto( 18 | "get the first letter of the header text", 19 | { 20 | page, 21 | test, 22 | }, 23 | options, 24 | ); 25 | 26 | // TODO assert that we are using locator_evaluate to get the first letter 27 | expect(headerText).toBe("H"); 28 | }); 29 | 30 | test("executes action", async ({ page }) => { 31 | await page.goto("/"); 32 | 33 | await auto(`Type "foo" in the search box`, { page, test }, options); 34 | 35 | await page.pause(); 36 | 37 | await expect(page.getByTestId("search-input")).toHaveValue("foo"); 38 | }); 39 | 40 | test("executes click", async ({ page }) => { 41 | await page.goto("/"); 42 | 43 | await auto( 44 | "Click the button until the counter value is equal to 2", 45 | { 46 | page, 47 | test, 48 | }, 49 | options, 50 | ); 51 | 52 | await expect(page.getByTestId("current-count")).toHaveText("2"); 53 | }); 54 | 55 | test("asserts (toBe)", async ({ page }) => { 56 | await page.goto("/"); 57 | 58 | const searchInputHasHeaderText = await auto( 59 | `Is 
the contents of the header equal to "Hello, Rayrun!"?`, 60 | { page, test }, 61 | options, 62 | ); 63 | 64 | expect(searchInputHasHeaderText).toBe(true); 65 | }); 66 | 67 | test("asserts (not.toBe)", async ({ page }) => { 68 | await page.goto("/"); 69 | 70 | const searchInputHasHeaderText = await auto( 71 | `Is the contents of the header equal to "Flying Donkeys"?`, 72 | { page, test }, 73 | options, 74 | ); 75 | 76 | expect(searchInputHasHeaderText).toBe(false); 77 | }); 78 | 79 | test("executes query, action and assertion", async ({ page }) => { 80 | await page.goto("/"); 81 | 82 | const headerText = await auto("get the header text", { page, test }, options); 83 | 84 | await auto(`type "${headerText}" in the search box`, { page, test }, options); 85 | 86 | const searchInputHasHeaderText = await auto( 87 | `is the contents of the search box equal to "${headerText}"?`, 88 | { page, test }, 89 | options, 90 | ); 91 | 92 | expect(searchInputHasHeaderText).toBe(true); 93 | }); 94 | 95 | test("runs without test parameter", async ({ page }) => { 96 | await page.goto("/"); 97 | 98 | const headerText = await auto("get the header text", { page }, options); 99 | 100 | expect(headerText.query).toBe("Hello, Rayrun!"); 101 | }); 102 | 103 | test("selects an option from dropdown using auto", async ({ page }) => { 104 | await page.goto("/"); 105 | 106 | await auto( 107 | "Select the 'Banana' option from the fruit dropdown", 108 | { page, test }, 109 | options, 110 | ); 111 | 112 | await expect(page.getByTestId("selected-fruit")).toHaveText("Banana"); 113 | }); 114 | 115 | test("selects an option from dropdown by value using auto", async ({ 116 | page, 117 | }) => { 118 | await page.goto("/"); 119 | 120 | await auto( 121 | "Select the option with value 'cherry' from the fruit dropdown", 122 | { page, test }, 123 | options, 124 | ); 125 | 126 | await expect(page.getByTestId("selected-fruit")).toHaveText("Cherry"); 127 | }); 128 | 129 | test("selects multiple options from 
multi-select using auto", async ({ 130 | page, 131 | }) => { 132 | await page.goto("/"); 133 | 134 | await auto( 135 | "Select the 'Red' and 'Blue' options from the colors multi-select", 136 | { page, test }, 137 | options, 138 | ); 139 | 140 | await expect(page.getByTestId("selected-colors")).toHaveText("Red, Blue"); 141 | }); 142 | 143 | test("extracts visible structure of the page using auto", async ({ page }) => { 144 | test.setTimeout(3 * 60 * 1000); 145 | 146 | await page.goto("/"); 147 | 148 | const structure = await auto( 149 | "Get the visible structure of the page", 150 | { page, test }, 151 | options, 152 | ); 153 | 154 | expect(typeof structure).toBe("string"); 155 | expect(structure.length).toBeGreaterThan(0); 156 | }); 157 | 158 | test("locates elements by ARIA role using auto", async ({ page }) => { 159 | await page.goto("/"); 160 | 161 | await auto( 162 | "Find and click the 'Click me' button using its role", 163 | { page, test }, 164 | options, 165 | ); 166 | 167 | const countText = await page 168 | .locator("[data-testid='current-count']") 169 | .innerText(); 170 | expect(countText).toBe("1"); 171 | }); 172 | 173 | test("locates elements by visible text using auto", async ({ page }) => { 174 | await page.goto("/"); 175 | 176 | await auto( 177 | "Find the fruit dropdown and select the option 'Banana' by visible text", 178 | { page, test }, 179 | options, 180 | ); 181 | 182 | const selectedFruit = await page 183 | .locator("[data-testid='selected-fruit']") 184 | .innerText(); 185 | expect(selectedFruit).toBe("Banana"); 186 | }); 187 | 188 | test("waits for dynamic content to load using auto", async ({ page }) => { 189 | await page.goto("/"); 190 | 191 | await auto( 192 | "Wait for the dynamic content to appear on the page", 193 | { page, test }, 194 | options, 195 | ); 196 | 197 | const dynamicContent = await page.locator("[data-testid='dynamic-content']"); 198 | await expect(dynamicContent).toBeVisible(); 199 | }); 200 | 201 | test("extracts only 
visible text from a specific element using auto", async ({ 202 | page, 203 | }) => { 204 | await page.goto("/"); 205 | 206 | const extractedText = await auto( 207 | "Extract the visible text from the 'Selected fruit' area", 208 | { page, test }, 209 | options, 210 | ); 211 | 212 | expect(typeof extractedText).toBe("string"); 213 | expect(extractedText.length).toBeGreaterThan(0); 214 | }); 215 | 216 | test("scrolls element into view using auto", async ({ page }) => { 217 | await page.goto("/"); 218 | 219 | await auto( 220 | "Scroll to the bottom of the page where it says 'You have reached the bottom of the page!'", 221 | { 222 | page, 223 | test, 224 | }, 225 | options, 226 | ); 227 | 228 | const isVisible = await page.locator("#bottom-of-page").isVisible(); 229 | expect(isVisible).toBeTruthy(); 230 | }); 231 | 232 | test("waits for network idle state using auto", async ({ page }) => { 233 | await page.goto("/"); 234 | 235 | await auto("Wait until network is idle", { page, test }, options); 236 | 237 | expect(true).toBe(true); 238 | }); 239 | -------------------------------------------------------------------------------- /tests/actions.spec.ts: -------------------------------------------------------------------------------- 1 | import { expect, test } from "@playwright/test"; 2 | import { createActions } from "../src/createActions"; 3 | import { ChatCompletionRunner } from "openai/lib/ChatCompletionRunner"; 4 | import { getSanitizeOptions } from "../src/sanitizeHtml"; 5 | 6 | const runner = {} as ChatCompletionRunner; 7 | 8 | test("finds element using a CSS locator and returns elementId", async ({ 9 | page, 10 | }) => { 11 | await page.goto("/"); 12 | 13 | const actions = createActions(page); 14 | 15 | const result = await actions.locateElement.function( 16 | { 17 | cssSelector: "h1", 18 | }, 19 | runner, 20 | ); 21 | 22 | expect(result).toStrictEqual({ 23 | elementId: expect.any(String), 24 | }); 25 | }); 26 | 27 | test("selects option by value in a select element 
using elementId", async ({ 28 | page, 29 | }) => { 30 | await page.goto("/"); 31 | 32 | const actions = createActions(page); 33 | 34 | const locateResult = (await actions.locateElement.function( 35 | { 36 | cssSelector: "#fruit-select", 37 | }, 38 | runner, 39 | )) as { elementId: string }; 40 | 41 | const selectResult = await actions.locator_selectOption.function( 42 | { 43 | elementId: locateResult.elementId, 44 | value: "banana", 45 | }, 46 | runner, 47 | ); 48 | 49 | expect(selectResult).toStrictEqual({ 50 | success: true, 51 | }); 52 | 53 | await expect(page.locator("#selected-fruit")).toHaveText("Banana"); 54 | }); 55 | 56 | test("selects option by value in a select element using CSS selector", async ({ 57 | page, 58 | }) => { 59 | await page.goto("/"); 60 | 61 | const actions = createActions(page); 62 | 63 | const selectResult = await actions.locator_selectOption.function( 64 | { 65 | cssSelector: "#fruit-select", 66 | value: "cherry", 67 | }, 68 | runner, 69 | ); 70 | 71 | expect(selectResult).toStrictEqual({ 72 | success: true, 73 | }); 74 | 75 | await expect(page.locator("#selected-fruit")).toHaveText("Cherry"); 76 | }); 77 | 78 | test("selects option by label in a select element using CSS selector", async ({ 79 | page, 80 | }) => { 81 | await page.goto("/"); 82 | 83 | const actions = createActions(page); 84 | 85 | const selectResult = await actions.locator_selectOption.function( 86 | { 87 | cssSelector: "#fruit-select", 88 | label: "Orange", 89 | }, 90 | runner, 91 | ); 92 | 93 | expect(selectResult).toStrictEqual({ 94 | success: true, 95 | }); 96 | 97 | await expect(page.locator("#selected-fruit")).toHaveText("Orange"); 98 | }); 99 | 100 | test("selects option by index in a select element using CSS selector", async ({ 101 | page, 102 | }) => { 103 | await page.goto("/"); 104 | 105 | const actions = createActions(page); 106 | 107 | const selectResult = await actions.locator_selectOption.function( 108 | { 109 | cssSelector: "#fruit-select", 110 | index: 
1, 111 | }, 112 | runner, 113 | ); 114 | 115 | expect(selectResult).toStrictEqual({ 116 | success: true, 117 | }); 118 | 119 | await expect(page.locator("#selected-fruit")).toHaveText("Apple"); 120 | }); 121 | 122 | test("selects multiple options in a multiple select element using CSS selector", async ({ 123 | page, 124 | }) => { 125 | await page.goto("/"); 126 | 127 | const actions = createActions(page); 128 | 129 | const selectResult = await actions.locator_selectOption.function( 130 | { 131 | cssSelector: "#colors-select", 132 | value: ["red", "blue"], 133 | }, 134 | runner, 135 | ); 136 | 137 | expect(selectResult).toStrictEqual({ 138 | success: true, 139 | }); 140 | 141 | await expect(page.locator("#selected-colors")).toHaveText("Red, Blue"); 142 | }); 143 | 144 | function createValidationFunction( 145 | allowedTags: string[], 146 | allowedAttributes: any, 147 | maxDepth = 3, 148 | ) { 149 | return function validateNode(node: any, depth = 0) { 150 | expect(node.tag).toBeDefined(); 151 | expect(allowedTags).toContain(node.tag); 152 | 153 | if (allowedAttributes !== false) { 154 | const allowedForAll = allowedAttributes?.["*"]; 155 | const allowedForTag = allowedAttributes?.[node.tag]; 156 | 157 | const isAllowAllForTag = allowedForTag === true; 158 | const isAllowAllGlobal = allowedForAll === true; 159 | 160 | for (const attrName of Object.keys(node.attributes || {})) { 161 | if (!(isAllowAllForTag || isAllowAllGlobal)) { 162 | if (Array.isArray(allowedForTag)) { 163 | expect(allowedForTag).toContain(attrName); 164 | } else if (Array.isArray(allowedForAll)) { 165 | expect(allowedForAll).toContain(attrName); 166 | } else { 167 | throw new Error( 168 | `Attribute ${attrName} is not allowed for tag ${node.tag}`, 169 | ); 170 | } 171 | } 172 | } 173 | } 174 | 175 | if (depth > maxDepth) { 176 | throw new Error(`Depth exceeded maxDepth: ${depth}`); 177 | } 178 | 179 | if (Array.isArray(node.children)) { 180 | for (const child of node.children) { 181 | 
validateNode(child, depth + 1); 182 | } 183 | } 184 | }; 185 | } 186 | 187 | test("getVisibleStructure on default page", async ({ page }) => { 188 | await page.goto("http://localhost:3000/tests/pages/default.html"); 189 | 190 | const actions = createActions(page); 191 | 192 | const { structure } = (await actions.getVisibleStructure.function( 193 | {}, 194 | runner, 195 | )) as { structure: any }; 196 | 197 | expect(typeof structure).toBe("object"); 198 | expect(structure).not.toBeNull(); 199 | 200 | const sanitizeOptions = getSanitizeOptions(); 201 | const validateNode = createValidationFunction( 202 | sanitizeOptions.allowedTags || [], 203 | sanitizeOptions.allowedAttributes, 204 | ); 205 | 206 | validateNode(structure); 207 | }); 208 | 209 | test("getVisibleStructure on all attributes page", async ({ page }) => { 210 | await page.goto("http://localhost:3000/tests/pages/all-attributes.html"); 211 | 212 | const actions = createActions(page); 213 | 214 | const { structure } = (await actions.getVisibleStructure.function( 215 | {}, 216 | runner, 217 | )) as { structure: any }; 218 | 219 | expect(typeof structure).toBe("object"); 220 | expect(structure).not.toBeNull(); 221 | 222 | const sanitizeOptions = getSanitizeOptions(); 223 | const validateNode = createValidationFunction( 224 | sanitizeOptions.allowedTags || [], 225 | sanitizeOptions.allowedAttributes, 226 | ); 227 | 228 | validateNode(structure); 229 | }); 230 | 231 | test("getVisibleStructure respects max depth", async ({ page }) => { 232 | await page.goto("http://localhost:3000/tests/pages/deep-nesting.html"); 233 | 234 | const actions = createActions(page); 235 | 236 | const { structure } = (await actions.getVisibleStructure.function( 237 | {}, 238 | runner, 239 | )) as { structure: any }; 240 | 241 | expect(typeof structure).toBe("object"); 242 | expect(structure).not.toBeNull(); 243 | 244 | const sanitizeOptions = getSanitizeOptions(); 245 | const validateNode = createValidationFunction( 246 | 
sanitizeOptions.allowedTags || [], 247 | sanitizeOptions.allowedAttributes, 248 | 5, 249 | ); 250 | 251 | validateNode(structure); 252 | }); 253 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # Auto Playwright 2 | 3 | Run Playwright tests using AI. 4 | 5 | ## Setup 6 | 7 | 1. Install `auto-playwright` dependency: 8 | 9 | ```bash 10 | npm install auto-playwright -D 11 | ``` 12 | 13 | 2. This package relies on talking with OpenAI (https://openai.com/). You must export the API token as an environment variable or add it to your `.env` file: 14 | 15 | ```bash 16 | export OPENAI_API_KEY='sk-...' 17 | ``` 18 | 19 | 3. Import and use the `auto` function: 20 | 21 | ```ts 22 | import { test, expect } from "@playwright/test"; 23 | import { auto } from "auto-playwright"; 24 | 25 | test("auto Playwright example", async ({ page }) => { 26 | await page.goto("/"); 27 | 28 | // `auto` can query data 29 | // In this case, the result is plain-text contents of the header 30 | const headerText = await auto("get the header text", { page, test }); 31 | 32 | // `auto` can perform actions 33 | // In this case, auto will find and fill in the search text input 34 | await auto(`Type "${headerText}" in the search box`, { page, test }); 35 | 36 | // `auto` can assert the state of the website 37 | // In this case, the result is a boolean outcome 38 | const searchInputHasHeaderText = await auto( 39 | `Is the contents of the search box equal to "${headerText}"?`, 40 | { page, test }, 41 | ); 42 | 43 | expect(searchInputHasHeaderText).toBe(true); 44 | }); 45 | ``` 46 | 47 | ### Setup with Azure OpenAI 48 | 49 | Include the StepOptions type with the values needed for connecting to Azure OpenAI.
50 | 51 | ```ts 52 | import { test, expect } from "@playwright/test"; 53 | import { auto } from "auto-playwright"; 54 | import { StepOptions } from "../src/types"; 55 | 56 | const apiKey = "apikey"; 57 | const resource = "azure-resource-name"; 58 | const model = "model-deployment-name"; 59 | 60 | const options: StepOptions = { 61 | model: model, 62 | openaiApiKey: apiKey, 63 | openaiBaseUrl: `https://${resource}.openai.azure.com/openai/deployments/${model}`, 64 | openaiDefaultQuery: { "api-version": "2023-07-01-preview" }, 65 | openaiDefaultHeaders: { "api-key": apiKey }, 66 | }; 67 | 68 | test("auto Playwright example", async ({ page }) => { 69 | await page.goto("/"); 70 | 71 | // `auto` can query data 72 | // In this case, the result is plain-text contents of the header 73 | const headerText = await auto("get the header text", { page, test }, options); 74 | 75 | // `auto` can perform actions 76 | // In this case, auto will find and fill in the search text input 77 | await auto(`Type "${headerText}" in the search box`, { page, test }, options); 78 | 79 | // `auto` can assert the state of the website 80 | // In this case, the result is a boolean outcome 81 | const searchInputHasHeaderText = await auto( 82 | `Is the contents of the search box equal to "${headerText}"?`, 83 | { page, test }, 84 | options, 85 | ); 86 | 87 | expect(searchInputHasHeaderText).toBe(true); 88 | }); 89 | ``` 90 | 91 | ## Usage 92 | 93 | At minimum, the `auto` function requires a _plain text prompt_ and an _argument_ that contains your `page` and `test` (optional) objects. 
94 | 95 | ```ts 96 | auto("", { page, test }); 97 | ``` 98 | 99 | ### Browser automation 100 | 101 | Running without the `test` parameter: 102 | 103 | ```ts 104 | import { chromium } from "playwright"; 105 | import { auto } from "auto-playwright"; 106 | 107 | (async () => { 108 | const browser = await chromium.launch({ headless: true }); 109 | const context = await browser.newContext(); 110 | const page = await context.newPage(); 111 | // Navigate to a website 112 | await page.goto("https://www.example.com"); 113 | 114 | // `auto` can query data 115 | // In this case, the result is plain-text contents of the header 116 | const res = await auto("get the header text", { page }); 117 | 118 | // use res.query to get a query result. 119 | console.log(res); 120 | await page.close(); 121 | })(); 122 | ``` 123 | 124 | ### Debug 125 | 126 | You may pass a `debug` attribute as the third parameter to the `auto` function. This will print the prompt and the commands executed by OpenAI. 127 | 128 | ```ts 129 | await auto("get the header text", { page, test }, { debug: true }); 130 | ``` 131 | 132 | You may also set environment variable `AUTO_PLAYWRIGHT_DEBUG=true`, which will enable debugging for all `auto` calls. 133 | 134 | ```bash 135 | export AUTO_PLAYWRIGHT_DEBUG=true 136 | ``` 137 | 138 | ## Supported Browsers 139 | 140 | Every browser that Playwright supports. 141 | 142 | ## Additional Options 143 | 144 | There are additional options you can pass as a third argument: 145 | 146 | ```ts 147 | const options = { 148 | // If true, debugging information is printed in the console. 
149 | debug: boolean, 150 | // The OpenAI model (https://platform.openai.com/docs/models/overview) 151 | model: "gpt-4-1106-preview", 152 | // The OpenAI API key 153 | openaiApiKey: "sk-...", 154 | }; 155 | 156 | auto("", { page, test }, options); 157 | ``` 158 | 159 | ## Supported Actions & Return Values 160 | 161 | Depending on the `type` of action (inferred by the `auto` function), there are different behaviors and return types. 162 | 163 | ### Action 164 | 165 | An action (e.g. "click") is some simulated user interaction with the page, e.g. a click on a link. Actions will return `undefined` if they were successful and will throw an error if they failed, e.g. 166 | 167 | ```ts 168 | try { 169 | await auto("click the link", { page, test }); 170 | } catch (e) { 171 | console.error("failed to click the link"); 172 | } 173 | ``` 174 | 175 | ### Query 176 | 177 | A query will return requested data from the page as a string, e.g. 178 | 179 | ```ts 180 | const linkText = await auto("Get the text of the first link", { page, test }); 181 | 182 | console.log("The link text is", linkText); 183 | ``` 184 | 185 | ### Assert 186 | 187 | An assertion is a question that will return `true` or `false`, e.g. 188 | 189 | ```ts 190 | const thereAreThreeLinks = await auto("Are there 3 links on the page?", { 191 | page, 192 | test, 193 | }); 194 | 195 | console.log(`"There are 3 links" is a ${thereAreThreeLinks} statement`); 196 | ``` 197 | 198 | ## Why use Auto Playwright? 199 | 200 | | Aspect | Conventional Approach | Testing with Auto Playwright | 201 | | ------------------------------ | ----------------------------------------------------------------------------------- | ---------------------------------------------------------------------------------------------------------------------------- | 202 | | **Coupling with Markup** | Strongly linked to the application's markup. | Eliminates the use of selectors; actions are determined by the AI assistant at runtime.
| 203 | | **Speed of Implementation** | Slower implementation due to the need for precise code translation for each action. | Rapid test creation using simple, plain text instructions for actions and assertions. | 204 | | **Handling Complex Scenarios** | Automating complex scenarios is challenging and prone to frequent failures. | Facilitates testing of complex scenarios by focusing on the intended test outcomes. | 205 | | **Test Writing Timing** | Can only write tests after the complete development of the functionality. | Enables a Test-Driven Development (TDD) approach, allowing test writing concurrent with or before functionality development. | 206 | 207 | ## Supported Playwright Actions 208 | 209 | - `locator.blur` 210 | - `locator.boundingBox` 211 | - `locator.check` 212 | - `locator.clear` 213 | - `locator.click` 214 | - `locator.count` 215 | - `locator.fill` 216 | - `locator.getAttribute` 217 | - `locator.innerHTML` 218 | - `locator.innerText` 219 | - `locator.inputValue` 220 | - `locator.isChecked` 221 | - `locator.isEditable` 222 | - `locator.isEnabled` 223 | - `locator.isVisible` 224 | - `locator.pressKey` 225 | - `locator.selectOption` 226 | - `locator.textContent` 227 | - `locator.uncheck` 228 | - `page.goto` 229 | - `page.keyboard.press` 230 | 231 | Adding new actions is easy: just update the `functions` in [`src/completeTask.ts`](src/completeTask.ts). 232 | 233 | ## Pricing 234 | 235 | This library is free. However, there are costs associated with using OpenAI. You can find more information about pricing here: https://openai.com/pricing/. 236 | 237 |

238 |

Example

239 | 240 | Using https://ray.run/ as an example, the cost of running a test step is approximately $0.01 using GPT-4 Turbo (and $0.001 using GPT-3.5 Turbo). 241 | 242 | The low cost is in part because `auto-playwright` uses HTML sanitization to reduce the payload size, e.g. What follows is the payload that would be submitted for https://ray.run/. 243 | 244 | Naturally, the price will vary dramatically depending on the payload. 245 | 246 | ```html 247 |

248 |

249 |

250 | Learn Playwright 251 |

252 |

253 | Resources for learning end-to-end testing using Playwright automation 254 | framework 255 |

256 |

259 |

260 |

261 |

Blog

265 |

266 |

Learn in depth subjects about end-to-end testing.

Ask ChatGPT Playwright questions.

All-in-one toolbox for QA engineers.

Handpicked QA and Automation opportunities.

Ask AI answered questions about Playwright.

Archive of Discord Forum posts about Playwright.

Tutorials, conference talks, and release videos.

GUI for generating Playwright locators.

Definitions of common end-to-end testing terms.

323 |

325 |

326 |

329 |

330 | Use ⌘ + 331 | k + "Tools" to quickly access all tools. 332 |

333 |

334 |

335 | ``` 336 | 337 |

338 | 339 | ## Implementation 340 | 341 | ### HTML Sanitization 342 | 343 | The `auto` function uses [sanitize-html](https://www.npmjs.com/package/sanitize-html) to sanitize the HTML of the page before sending it to OpenAI. This is done to reduce cost and improve the quality of the generated text. 344 | 345 | ## ZeroStep 346 | 347 | This project draws its inspiration from [ZeroStep](https://zerostep.com/). ZeroStep offers a similar API but with a more robust implementation through its proprietary backend. Auto Playwright was created with the aim of exploring the underlying technology of ZeroStep and establishing a basis for an open-source version of their software. For production environments, I suggest opting for ZeroStep. 348 | 349 | Here's a side-by-side comparison of Auto Playwright and ZeroStep: 350 | 351 | | Criteria | Auto Playwright | ZeroStep | 352 | | ------------------------------------------------------------------------------------- | --------------- | -------- | 353 | | Uses OpenAI API | Yes | No[^3] | 354 | | Uses plain-text prompts | Yes | No | 355 | | Uses [`functions`](https://www.npmjs.com/package/openai#automated-function-calls) SDK | Yes | No | 356 | | Uses HTML sanitization | Yes | No | 357 | | Uses Playwright API | Yes | No[^4] | 358 | | Uses screenshots | No | Yes | 359 | | Uses queue | No | Yes | 360 | | Uses WebSockets | No | Yes | 361 | | Snapshots | HTML | DOM | 362 | | Implements parallelism | No | Yes | 363 | | Allows scrolling | No | Yes | 364 | | Provides fixtures | No | Yes | 365 | | License | MIT | MIT | 366 | 367 | [^3]: Uses ZeroStep proprietary API. 368 | 369 | [^4]: Uses _some_ Playwright API, but predominantly relies on Chrome DevTools Protocol (CDP). 370 | 371 |

372 |

Zero Step License

373 | 374 | ``` 375 | MIT License 376 | 377 | Copyright (c) 2023 Reflect Software Inc 378 | 379 | Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: 380 | 381 | The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. 382 | 383 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 384 | ``` 385 | 386 |

387 | -------------------------------------------------------------------------------- /src/createActions.ts: -------------------------------------------------------------------------------- 1 | import { Page } from "@playwright/test"; 2 | import { randomUUID } from "crypto"; 3 | import { RunnableFunctionWithParse } from "openai/lib/RunnableFunction"; 4 | import { z } from "zod"; 5 | import { getSanitizeOptions } from "./sanitizeHtml"; 6 | 7 | export const createActions = ( 8 | page: Page, 9 | ): Record> => { 10 | const getLocator = (elementId: string) => { 11 | return page.locator(`[data-element-id="${elementId}"]`); 12 | }; 13 | 14 | return { 15 | locator_pressKey: { 16 | function: async (args: { elementId: string; key: string }) => { 17 | const { elementId, key } = args; 18 | await getLocator(elementId).press(key); 19 | return { success: true }; 20 | }, 21 | name: "locator_pressKey", 22 | description: "Presses a key while focused on the specified element.", 23 | parse: (args: string) => { 24 | return z 25 | .object({ 26 | elementId: z.string(), 27 | key: z.string(), 28 | }) 29 | .parse(JSON.parse(args)); 30 | }, 31 | parameters: { 32 | type: "object", 33 | properties: { 34 | elementId: { type: "string" }, 35 | key: { 36 | type: "string", 37 | description: 38 | "The name of the key to press, e.g., 'Enter', 'ArrowUp', 'a'.", 39 | }, 40 | }, 41 | }, 42 | }, 43 | page_pressKey: { 44 | function: async (args: { elementId: string; key: string }) => { 45 | const { key } = args; 46 | await page.keyboard.press(key); 47 | return { success: true }; 48 | }, 49 | name: "page_pressKey", 50 | description: "Presses a key globally on the page.", 51 | parse: (args: string) => { 52 | return z 53 | .object({ 54 | key: z.string(), 55 | }) 56 | .parse(JSON.parse(args)); 57 | }, 58 | parameters: { 59 | type: "object", 60 | properties: { 61 | key: { 62 | type: "string", 63 | description: 64 | "The name of the key to press, e.g., 'Enter', 'ArrowDown', 'b'.", 65 | }, 66 | }, 67 | }, 68 | 
}, 69 | locateElement: { 70 | function: async (args: { cssSelector: string }) => { 71 | const locator = page.locator(args.cssSelector); 72 | const elementId = randomUUID(); 73 | await locator 74 | .first() 75 | .evaluate( 76 | (node, id) => node.setAttribute("data-element-id", id), 77 | elementId, 78 | ); 79 | return { elementId }; 80 | }, 81 | name: "locateElement", 82 | description: 83 | "Locates element using a CSS selector and returns elementId. This element ID can be used with other functions to perform actions on the element.", 84 | parse: (args: string) => { 85 | return z 86 | .object({ 87 | cssSelector: z.string(), 88 | }) 89 | .parse(JSON.parse(args)); 90 | }, 91 | parameters: { 92 | type: "object", 93 | properties: { 94 | cssSelector: { 95 | type: "string", 96 | }, 97 | }, 98 | }, 99 | }, 100 | locator_evaluate: { 101 | function: async (args: { pageFunction: string; elementId: string }) => { 102 | return { 103 | result: await getLocator(args.elementId).evaluate(args.pageFunction), 104 | }; 105 | }, 106 | description: 107 | "Execute JavaScript code in the page, taking the matching element as an argument.", 108 | name: "locator_evaluate", 109 | parameters: { 110 | type: "object", 111 | properties: { 112 | elementId: { 113 | type: "string", 114 | }, 115 | pageFunction: { 116 | type: "string", 117 | description: 118 | "Function to be evaluated in the page context, e.g. 
node => node.innerText", 119 | }, 120 | }, 121 | }, 122 | parse: (args: string) => { 123 | return z 124 | .object({ 125 | elementId: z.string(), 126 | pageFunction: z.string(), 127 | }) 128 | .parse(JSON.parse(args)); 129 | }, 130 | }, 131 | locator_getAttribute: { 132 | function: async (args: { attributeName: string; elementId: string }) => { 133 | return { 134 | attributeValue: await getLocator(args.elementId).getAttribute( 135 | args.attributeName, 136 | ), 137 | }; 138 | }, 139 | name: "locator_getAttribute", 140 | description: "Returns the matching element's attribute value.", 141 | parse: (args: string) => { 142 | return z 143 | .object({ 144 | elementId: z.string(), 145 | attributeName: z.string(), 146 | }) 147 | .parse(JSON.parse(args)); 148 | }, 149 | parameters: { 150 | type: "object", 151 | properties: { 152 | attributeName: { 153 | type: "string", 154 | }, 155 | elementId: { 156 | type: "string", 157 | }, 158 | }, 159 | }, 160 | }, 161 | locator_innerHTML: { 162 | function: async (args: { elementId: string }) => { 163 | return { innerHTML: await getLocator(args.elementId).innerHTML() }; 164 | }, 165 | name: "locator_innerHTML", 166 | description: "Returns the element.innerHTML.", 167 | parse: (args: string) => { 168 | return z 169 | .object({ 170 | elementId: z.string(), 171 | }) 172 | .parse(JSON.parse(args)); 173 | }, 174 | parameters: { 175 | type: "object", 176 | properties: { 177 | elementId: { 178 | type: "string", 179 | }, 180 | }, 181 | }, 182 | }, 183 | locator_innerText: { 184 | function: async (args: { elementId: string }) => { 185 | return { innerText: await getLocator(args.elementId).innerText() }; 186 | }, 187 | name: "locator_innerText", 188 | description: "Returns the element.innerText.", 189 | parse: (args: string) => { 190 | return z 191 | .object({ 192 | elementId: z.string(), 193 | }) 194 | .parse(JSON.parse(args)); 195 | }, 196 | parameters: { 197 | type: "object", 198 | properties: { 199 | elementId: { 200 | type: "string", 201 | 
}, 202 | }, 203 | }, 204 | }, 205 | locator_textContent: { 206 | function: async (args: { elementId: string }) => { 207 | return { 208 | textContent: await getLocator(args.elementId).textContent(), 209 | }; 210 | }, 211 | name: "locator_textContent", 212 | description: "Returns the node.textContent.", 213 | parse: (args: string) => { 214 | return z 215 | .object({ 216 | elementId: z.string(), 217 | }) 218 | .parse(JSON.parse(args)); 219 | }, 220 | parameters: { 221 | type: "object", 222 | properties: { 223 | elementId: { 224 | type: "string", 225 | }, 226 | }, 227 | }, 228 | }, 229 | locator_inputValue: { 230 | function: async (args: { elementId: string }) => { 231 | return { 232 | inputValue: await getLocator(args.elementId).inputValue(), 233 | }; 234 | }, 235 | name: "locator_inputValue", 236 | description: 237 | "Returns input.value for the selected or

or <select> element.",
 238 |       parse: (args: string) => {
 239 |         return z
 240 |           .object({
 241 |             elementId: z.string(),
 242 |           })
 243 |           .parse(JSON.parse(args));
 244 |       },
 245 |       parameters: {
 246 |         type: "object",
 247 |         properties: {
 248 |           elementId: {
 249 |             type: "string",
 250 |           },
 251 |         },
 252 |       },
 253 |     },
 254 |     locator_blur: {
             // Action entry "locator_blur": resolves the element through getLocator()
             // (a [data-element-id="…"] selector), awaits Playwright's blur() on it and
             // reports { success: true }. A rejection from blur() is not caught here.
 255 |       function: async (args: { elementId: string }) => {
 256 |         await getLocator(args.elementId).blur();
 257 | 
 258 |         return { success: true };
 259 |       },
 260 |       name: "locator_blur",
 261 |       description: "Removes keyboard focus from the current element.",
             // Turns the raw JSON argument string into a validated object; JSON.parse
             // or zod's parse() throws when the input is malformed or elementId is not
             // a string.
 262 |       parse: (args: string) => {
 263 |         return z
 264 |           .object({
 265 |             elementId: z.string(),
 266 |           })
 267 |           .parse(JSON.parse(args));
 268 |       },
             // JSON-Schema-style description of the arguments.
             // NOTE(review): elementId is not marked as required here although parse()
             // rejects input without it — confirm this is intended.
 269 |       parameters: {
 270 |         type: "object",
 271 |         properties: {
 272 |           elementId: {
 273 |             type: "string",
 274 |           },
 275 |         },
 276 |       },
 277 |     },
 278 |     locator_boundingBox: {
             // Action entry "locator_boundingBox": looks the element up via
             // getLocator(elementId) and returns whatever Playwright's boundingBox()
             // resolves to. The value is returned as-is (it may be null, per the
             // description below) rather than being wrapped in a named property.
 279 |       function: async (args: { elementId: string }) => {
 280 |         return await getLocator(args.elementId).boundingBox();
 281 |       },
 282 |       name: "locator_boundingBox",
 283 |       description:
 284 |         "This method returns the bounding box of the element matching the locator, or null if the element is not visible. The bounding box is calculated relative to the main frame viewport - which is usually the same as the browser window. The returned object has x, y, width, and height properties.",
             // Parses the JSON argument string and validates that elementId is a
             // string; invalid JSON or a failed validation throws.
 285 |       parse: (args: string) => {
 286 |         return z
 287 |           .object({
 288 |             elementId: z.string(),
 289 |           })
 290 |           .parse(JSON.parse(args));
 291 |       },
             // Argument schema: one string property, elementId.
             // NOTE(review): no "required" list is declared even though parse()
             // demands elementId — confirm this is intended.
 292 |       parameters: {
 293 |         type: "object",
 294 |         properties: {
 295 |           elementId: {
 296 |             type: "string",
 297 |           },
 298 |         },
 299 |       },
 300 |     },
 301 |     locator_check: {
             // Action entry "locator_check": awaits Playwright's check() on the
             // element selected by getLocator(elementId), then returns
             // { success: true }. Nothing here catches a failure from check(), so it
             // surfaces as a rejected promise.
 302 |       function: async (args: { elementId: string }) => {
 303 |         await getLocator(args.elementId).check();
 304 | 
 305 |         return { success: true };
 306 |       },
 307 |       name: "locator_check",
 308 |       description: "Ensure that checkbox or radio element is checked.",
             // Decodes the JSON argument string and validates it with zod (elementId
             // must be a string); throws on malformed JSON or a validation failure.
 309 |       parse: (args: string) => {
 310 |         return z
 311 |           .object({
 312 |             elementId: z.string(),
 313 |           })
 314 |           .parse(JSON.parse(args));
 315 |       },
             // Argument schema: a single string property, elementId.
             // NOTE(review): elementId is not declared as required in this schema,
             // unlike in parse() — confirm this is intended.
 316 |       parameters: {
 317 |         type: "object",
 318 |         properties: {
 319 |           elementId: {
 320 |             type: "string",
 321 |           },
 322 |         },
 323 |       },
 324 |     },
 325 |     locator_uncheck: {
             // Action entry "locator_uncheck": awaits Playwright's uncheck() on the
             // element selected by getLocator(elementId) and then returns
             // { success: true }. Errors from uncheck() are not handled here.
 326 |       function: async (args: { elementId: string }) => {
 327 |         await getLocator(args.elementId).uncheck();
 328 | 
 329 |         return { success: true };
 330 |       },
 331 |       name: "locator_uncheck",
 332 |       description: "Ensure that checkbox or radio element is unchecked.",
             // Parses the JSON argument string and checks that elementId is a string;
             // throws when the JSON is invalid or validation fails.
 333 |       parse: (args: string) => {
 334 |         return z
 335 |           .object({
 336 |             elementId: z.string(),
 337 |           })
 338 |           .parse(JSON.parse(args));
 339 |       },
             // Argument schema: a single string property, elementId.
             // NOTE(review): the schema does not list elementId as required although
             // parse() requires it — confirm this is intended.
 340 |       parameters: {
 341 |         type: "object",
 342 |         properties: {
 343 |           elementId: {
 344 |             type: "string",
 345 |           },
 346 |         },
 347 |       },
 348 |     },
 349 |     locator_isChecked: {
             // Action entry "locator_isChecked": read-only query that wraps the result
             // of Playwright's isChecked() for the element selected by
             // getLocator(elementId) in an { isChecked } object.
 350 |       function: async (args: { elementId: string }) => {
 351 |         return { isChecked: await getLocator(args.elementId).isChecked() };
 352 |       },
 353 |       name: "locator_isChecked",
 354 |       description: "Returns whether the element is checked.",
             // Parses the JSON argument string and validates that elementId is a
             // string; throws on invalid JSON or failed validation.
 355 |       parse: (args: string) => {
 356 |         return z
 357 |           .object({
 358 |             elementId: z.string(),
 359 |           })
 360 |           .parse(JSON.parse(args));
 361 |       },
             // Argument schema: a single string property, elementId.
             // NOTE(review): elementId is not marked required here, while parse()
             // requires it — confirm this is intended.
 362 |       parameters: {
 363 |         type: "object",
 364 |         properties: {
 365 |           elementId: {
 366 |             type: "string",
 367 |           },
 368 |         },
 369 |       },
 370 |     },
 371 |     locator_isEditable: {
             // Action entry "locator_isEditable": read-only query returning
             // { isEditable } with the value resolved by Playwright's isEditable() for
             // the element selected by getLocator(elementId).
 372 |       function: async (args: { elementId: string }) => {
 373 |         return {
 374 |           isEditable: await getLocator(args.elementId).isEditable(),
 375 |         };
 376 |       },
 377 |       name: "locator_isEditable",
 378 |       description:
 379 |         "Returns whether the element is editable. Element is considered editable when it is enabled and does not have readonly property set.",
             // Parses the JSON argument string and validates that elementId is a
             // string; throws on invalid JSON or failed validation.
 380 |       parse: (args: string) => {
 381 |         return z
 382 |           .object({
 383 |             elementId: z.string(),
 384 |           })
 385 |           .parse(JSON.parse(args));
 386 |       },
             // Argument schema: a single string property, elementId.
             // NOTE(review): no "required" list is declared although parse() demands
             // elementId — confirm this is intended.
 387 |       parameters: {
 388 |         type: "object",
 389 |         properties: {
 390 |           elementId: {
 391 |             type: "string",
 392 |           },
 393 |         },
 394 |       },
 395 |     },
 396 |     locator_isEnabled: {
             // Action entry "locator_isEnabled": read-only query returning
             // { isEnabled } with the value resolved by Playwright's isEnabled() for
             // the element selected by getLocator(elementId).
 397 |       function: async (args: { elementId: string }) => {
 398 |         return { isEnabled: await getLocator(args.elementId).isEnabled() };
 399 |       },
 400 |       name: "locator_isEnabled",
 401 |       description:
 402 |         "Returns whether the element is enabled. Element is considered enabled unless it is a <button>, <select>, <input> or <textarea> with a disabled property.",
             // Parses the JSON argument string and validates that elementId is a
             // string; throws on invalid JSON or failed validation.
 403 |       parse: (args: string) => {
 404 |         return z
 405 |           .object({
 406 |             elementId: z.string(),
 407 |           })
 408 |           .parse(JSON.parse(args));
 409 |       },
             // Argument schema: a single string property, elementId.
             // NOTE(review): elementId is not declared as required in this schema,
             // unlike in parse() — confirm this is intended.
 410 |       parameters: {
 411 |         type: "object",
 412 |         properties: {
 413 |           elementId: {
 414 |             type: "string",
 415 |           },
 416 |         },
 417 |       },
 418 |     },
 419 |     locator_isVisible: {
             // Action entry "locator_isVisible": read-only query returning
             // { isVisible } with the value resolved by Playwright's isVisible() for
             // the element selected by getLocator(elementId).
 420 |       function: async (args: { elementId: string }) => {
 421 |         return { isVisible: await getLocator(args.elementId).isVisible() };
 422 |       },
 423 |       name: "locator_isVisible",
 424 |       description: "Returns whether the element is visible.",
             // Parses the JSON argument string and validates that elementId is a
             // string; throws on invalid JSON or failed validation.
 425 |       parse: (args: string) => {
 426 |         return z
 427 |           .object({
 428 |             elementId: z.string(),
 429 |           })
 430 |           .parse(JSON.parse(args));
 431 |       },
             // Argument schema: a single string property, elementId.
             // NOTE(review): the schema does not list elementId as required although
             // parse() requires it — confirm this is intended.
 432 |       parameters: {
 433 |         type: "object",
 434 |         properties: {
 435 |           elementId: {
 436 |             type: "string",
 437 |           },
 438 |         },
 439 |       },
 440 |     },
 441 |     locator_clear: {
             // Action entry "locator_clear": awaits Playwright's clear() on the
             // element selected by getLocator(elementId), then returns
             // { success: true }. A rejection from clear() is not caught here.
 442 |       function: async (args: { elementId: string }) => {
 443 |         await getLocator(args.elementId).clear();
 444 | 
 445 |         return { success: true };
 446 |       },
 447 |       name: "locator_clear",
 448 |       description: "Clear the input field.",
             // Parses the JSON argument string and validates that elementId is a
             // string; throws on invalid JSON or failed validation.
 449 |       parse: (args: string) => {
 450 |         return z
 451 |           .object({
 452 |             elementId: z.string(),
 453 |           })
 454 |           .parse(JSON.parse(args));
 455 |       },
             // Argument schema: a single string property, elementId.
             // NOTE(review): elementId is not marked required here, while parse()
             // requires it — confirm this is intended.
 456 |       parameters: {
 457 |         type: "object",
 458 |         properties: {
 459 |           elementId: {
 460 |             type: "string",
 461 |           },
 462 |         },
 463 |       },
 464 |     },
 465 |     locator_click: {
 466 |       function: async (args: { elementId: string }) => {
 467 |         await getLocator(args.elementId).click();
 468 | 
 469 |         return { success: true };
 470 |       },
 471 |       name: "locator_click",
 472 |       description: "Click an element.",
 473 |       parse: (args: string) => {
 474 |         return z
 475 |           .object({
 476 |             elementId: z.string(),
 477 |           })
 478 |           .parse(JSON.parse(args));
 479 |       },
 480 |       parameters: {
 481 |         type: "object",
 482 |         properties: {
 483 |           elementId: {
 484 |             type: "string",
 485 |           },
 486 |         },
 487 |       },
 488 |     },
 489 |     locator_count: {
 490 |       function: async (args: { elementId: string }) => {
 491 |         return { elementCount: await getLocator(args.elementId).count() };
 492 |       },
 493 |       name: "locator_count",
 494 |       description: "Returns the number of elements matching the locator.",
 495 |       parse: (args: string) => {
 496 |         return z
 497 |           .object({
 498 |             elementId: z.string(),
 499 |           })
 500 |           .parse(JSON.parse(args));
 501 |       },
 502 |       parameters: {
 503 |         type: "object",
 504 |         properties: {
 505 |           elementId: {
 506 |             type: "string",
 507 |           },
 508 |         },
 509 |       },
 510 |     },
 511 |     locator_fill: {
 512 |       function: async (args: { value: string; elementId: string }) => {
 513 |         await getLocator(args.elementId).fill(args.value);
 514 | 
 515 |         return {
 516 |           success: true,
 517 |         };
 518 |       },
 519 |       name: "locator_fill",
 520 |       description: "Set a value to the input field.",
 521 |       parse: (args: string) => {
 522 |         return z
 523 |           .object({
 524 |             elementId: z.string(),
 525 |             value: z.string(),
 526 |           })
 527 |           .parse(JSON.parse(args));
 528 |       },
 529 |       parameters: {
 530 |         type: "object",
 531 |         properties: {
 532 |           value: {
 533 |             type: "string",
 534 |           },
 535 |           elementId: {
 536 |             type: "string",
 537 |           },
 538 |         },
 539 |       },
 540 |     },
 541 |     page_goto: {
 542 |       function: async (args: { url: string }) => {
 543 |         return {
 544 |           url: await page.goto(args.url),
 545 |         };
 546 |       },
 547 |       name: "page_goto",
 548 |       description: "Navigate to the specified URL.",
 549 |       parse: (args: string) => {
 550 |         return z
 551 |           .object({
 552 |             url: z.string(),
 553 |           })
 554 |           .parse(JSON.parse(args));
 555 |       },
 556 |       parameters: {
 557 |         type: "object",
 558 |         properties: {
 559 |           url: {
 560 |             type: "string",
 561 |             description: "The URL to navigate to",
 562 |           },
 563 |         },
 564 |         required: ["url"],
 565 |       },
 566 |     },
 567 |     locator_selectOption: {
 568 |       function: async (args: {
 569 |         elementId?: string;
 570 |         cssSelector?: string;
 571 |         value?: string | string[];
 572 |         label?: string | string[];
 573 |         index?: number | number[];
 574 |       }) => {
 575 |         const { elementId, cssSelector, value, label, index } = args;
 576 | 
 577 |         let locator;
 578 | 
 579 |         if (elementId) {
 580 |           locator = page.locator(`[data-element-id="${elementId}"]`);
 581 |         } else if (cssSelector) {
 582 |           locator = page.locator(cssSelector);
 583 |         } else {
 584 |           throw new Error(
 585 |             "You must provide either an elementId or a cssSelector.",
 586 |           );
 587 |         }
 588 | 
 589 |         if (value !== undefined) {
 590 |           await locator.selectOption(value);
 591 |         } else if (label !== undefined) {
 592 |           const options = Array.isArray(label)
 593 |             ? label.map((l) => ({ label: l }))
 594 |             : { label };
 595 |           await locator.selectOption(options);
 596 |         } else if (index !== undefined) {
 597 |           const options = Array.isArray(index)
 598 |             ? index.map((i) => ({ index: i }))
 599 |             : { index };
 600 |           await locator.selectOption(options);
 601 |         } else {
 602 |           throw new Error(
 603 |             "You must provide at least one of the parameters: value, label, or index.",
 604 |           );
 605 |         }
 606 | 
 607 |         return { success: true };
 608 |       },
 609 |       name: "locator_selectOption",
 610 |       description:
 611 |         "Selects option(s) in a <select> element. Requires either an elementId (obtained via locateElement) or a direct cssSelector.",
 612 |       parse: (args: string) => {
 613 |         return z
 614 |           .object({
 615 |             elementId: z.string().optional(),
 616 |             cssSelector: z.string().optional(),
 617 |             value: z.union([z.string(), z.array(z.string())]).optional(),
 618 |             label: z.union([z.string(), z.array(z.string())]).optional(),
 619 |             index: z.union([z.number(), z.array(z.number())]).optional(),
 620 |           })
 621 |           .refine(
 622 |             (data) =>
 623 |               data.elementId !== undefined || data.cssSelector !== undefined,
 624 |             {
 625 |               message: "Either elementId or cssSelector must be provided.",
 626 |             },
 627 |           )
 628 |           .refine(
 629 |             (data) =>
 630 |               data.value !== undefined ||
 631 |               data.label !== undefined ||
 632 |               data.index !== undefined,
 633 |             {
 634 |               message:
 635 |                 "At least one of value, label, or index must be provided.",
 636 |             },
 637 |           )
 638 |           .parse(JSON.parse(args));
 639 |       },
 640 |       parameters: {
 641 |         type: "object",
 642 |         properties: {
 643 |           elementId: {
 644 |             type: "string",
 645 |             description:
 646 |               "The ID of the <select> element, obtained via locateElement.",
 647 |           },
 648 |           cssSelector: {
 649 |             type: "string",
 650 |             description:
 651 |               "CSS selector to locate the <select> element directly, e.g., '#my-select' or 'form select'.",
 652 |           },
 653 |           value: {
 654 |             type: ["string", "array"],
 655 |             description:
 656 |               "Select options with matching value attribute. Can be a string or an array for multi-select.",
 657 |             items: {
 658 |               type: "string"
 659 |             }
 660 |           },
 661 |           label: {
 662 |             type: ["string", "array"],
 663 |             description:
 664 |               "Select options with matching visible text. Can be a string or an array for multi-select.",
 665 |             items: {
 666 |               type: "string"
 667 |             }
 668 |           },
 669 |           index: {
 670 |             type: ["number", "array"],
 671 |             description:
 672 |               "Select options by their index (zero-based). Can be a number or an array for multi-select.",
 673 |             items: {
 674 |               type: "number"
 675 |             }
 676 |           },
 677 |         },
 678 |       },
 679 |     },
 680 |     expect_toBe: {
 681 |       function: (args: { actual: string; expected: string }) => {
 682 |         return {
 683 |           actual: args.actual,
 684 |           expected: args.expected,
 685 |           success: args.actual === args.expected,
 686 |         };
 687 |       },
 688 |       name: "expect_toBe",
 689 |       description:
 690 |         "Asserts that the actual value is equal to the expected value.",
 691 |       parse: (args: string) => {
 692 |         return z
 693 |           .object({
 694 |             actual: z.string(),
 695 |             expected: z.string(),
 696 |           })
 697 |           .parse(JSON.parse(args));
 698 |       },
 699 |       parameters: {
 700 |         type: "object",
 701 |         properties: {
 702 |           actual: {
 703 |             type: "string",
 704 |           },
 705 |           expected: {
 706 |             type: "string",
 707 |           },
 708 |         },
 709 |       },
 710 |     },
 711 |     expect_notToBe: {
 712 |       function: (args: { actual: string; expected: string }) => {
 713 |         return {
 714 |           actual: args.actual,
 715 |           expected: args.expected,
 716 |           success: args.actual !== args.expected,
 717 |         };
 718 |       },
 719 |       name: "expect_notToBe",
 720 |       description:
 721 |         "Asserts that the actual value is not equal to the expected value.",
 722 |       parse: (args: string) => {
 723 |         return z
 724 |           .object({
 725 |             actual: z.string(),
 726 |             expected: z.string(),
 727 |           })
 728 |           .parse(JSON.parse(args));
 729 |       },
 730 |       parameters: {
 731 |         type: "object",
 732 |         properties: {
 733 |           actual: {
 734 |             type: "string",
 735 |           },
 736 |           expected: {
 737 |             type: "string",
 738 |           },
 739 |         },
 740 |       },
 741 |     },
 742 |     resultAssertion: {
 743 |       function: (args: { assertion: boolean }) => {
 744 |         return args;
 745 |       },
 746 |       parse: (args: string) => {
 747 |         return z
 748 |           .object({
 749 |             assertion: z.boolean(),
 750 |           })
 751 |           .parse(JSON.parse(args));
 752 |       },
 753 |       description:
 754 |         "This function is called when the initial instructions asked to assert something; then 'assertion' is either true or false (boolean) depending on whether the assertion succeeded.",
 755 |       name: "resultAssertion",
 756 |       parameters: {
 757 |         type: "object",
 758 |         properties: {
 759 |           assertion: {
 760 |             type: "boolean",
 761 |           },
 762 |         },
 763 |       },
 764 |     },
 765 |     resultQuery: {
 766 |       function: (args: { query: string }) => {
 767 |         return args;
 768 |       },
 769 |       parse: (args: string) => {
 770 |         return z
 771 |           .object({
 772 |             query: z.string(),
 773 |           })
 774 |           .parse(JSON.parse(args));
 775 |       },
 776 |       description:
 777 |         "This function is called at the end when the initial instructions asked to extract data; then 'query' property is set to a text value of the extracted data.",
 778 |       name: "resultQuery",
 779 |       parameters: {
 780 |         type: "object",
 781 |         properties: {
 782 |           query: {
 783 |             type: "string",
 784 |           },
 785 |         },
 786 |       },
 787 |     },
 788 |     resultAction: {
 789 |       function: () => {
 790 |         return { success: true };
 791 |       },
 792 |       parse: (args: string) => {
 793 |         return z.object({}).parse(JSON.parse(args));
 794 |       },
 795 |       description:
 796 |         "This function is called at the end when the initial instructions asked to perform an action.",
 797 |       name: "resultAction",
 798 |       parameters: {
 799 |         type: "object",
 800 |         properties: {},
 801 |       },
 802 |     },
 803 |     resultError: {
 804 |       function: (args: { errorMessage: string }) => {
 805 |         return {
 806 |           errorMessage: args.errorMessage,
 807 |         };
 808 |       },
 809 |       parse: (args: string) => {
 810 |         return z
 811 |           .object({
 812 |             errorMessage: z.string(),
 813 |           })
 814 |           .parse(JSON.parse(args));
 815 |       },
 816 |       description:
 817 |         "If user instructions cannot be completed, then this function is used to produce the final response.",
 818 |       name: "resultError",
 819 |       parameters: {
 820 |         type: "object",
 821 |         properties: {
 822 |           errorMessage: {
 823 |             type: "string",
 824 |           },
 825 |         },
 826 |       },
 827 |     },
 828 |     getVisibleStructure: {
 829 |       function: async () => {
 830 |         const sanitizeOptions = getSanitizeOptions();
 831 |         const allowedTags = sanitizeOptions.allowedTags || [];
 832 |         const allowedAttributes = sanitizeOptions.allowedAttributes;
 833 |         const maxDepth = 30; // Можно вынести наверх файла в константу при желании
 834 | 
 835 |         return {
 836 |           structure: await page.evaluate(
 837 |             ({ allowedTags, allowedAttributes, maxDepth }) => {
 838 |               // @ts-ignore
 839 |               const extractVisibleStructure = (element, depth = 0) => {
 840 |                 if (!element || depth > maxDepth) return null;
 841 | 
 842 |                 const style = window.getComputedStyle(element);
 843 |                 if (
 844 |                   style.display === "none" ||
 845 |                   style.visibility === "hidden" ||
 846 |                   style.opacity === "0"
 847 |                 ) {
 848 |                   return null;
 849 |                 }
 850 | 
 851 |                 const tag = element.tagName.toLowerCase();
 852 |                 if (!allowedTags.includes(tag)) {
 853 |                   return null;
 854 |                 }
 855 | 
 856 |                 const node = {
 857 |                   tag: tag,
 858 |                   attributes: {},
 859 |                   children: [],
 860 |                 };
 861 | 
 862 |                 const elementAttributes = element.attributes;
 863 |                 if (allowedAttributes === false) {
 864 |                   for (let i = 0; i < elementAttributes.length; i++) {
 865 |                     const attr = elementAttributes[i];
 866 |                     // @ts-ignore
 867 |                     node.attributes[attr.name] = attr.value;
 868 |                   }
 869 |                 } else if (typeof allowedAttributes === "object") {
 870 |                   const allowedForAll = allowedAttributes["*"];
 871 |                   const allowedForTag = allowedAttributes[tag];
 872 | 
 873 |                   // @ts-ignore
 874 |                   const allowAllForTag = allowedForTag === true;
 875 |                   // @ts-ignore
 876 |                   const allowAllGlobal = allowedForAll === true;
 877 | 
 878 |                   for (let i = 0; i < elementAttributes.length; i++) {
 879 |                     const attr = elementAttributes[i];
 880 |                     const attrName = attr.name;
 881 | 
 882 |                     if (
 883 |                       allowAllForTag ||
 884 |                       allowAllGlobal ||
 885 |                       (Array.isArray(allowedForTag) &&
 886 |                         allowedForTag.includes(attrName)) ||
 887 |                       (Array.isArray(allowedForAll) &&
 888 |                         allowedForAll.includes(attrName))
 889 |                     ) {
 890 |                       // @ts-ignore
 891 |                       node.attributes[attrName] = attr.value;
 892 |                     }
 893 |                   }
 894 |                 }
 895 | 
 896 |                 const id = element.id;
 897 |                 if (id) {
 898 |                   // @ts-ignore
 899 |                   node.id = id;
 900 |                 }
 901 | 
 902 |                 const role = element.getAttribute("role");
 903 |                 if (role) {
 904 |                   // @ts-ignore
 905 |                   node.role = role;
 906 |                 }
 907 | 
 908 |                 const ariaLabel = element.getAttribute("aria-label");
 909 |                 if (ariaLabel) {
 910 |                   // @ts-ignore
 911 |                   node.ariaLabel = ariaLabel;
 912 |                 }
 913 | 
 914 |                 const className = element.className?.trim();
 915 |                 if (className) {
 916 |                   // @ts-ignore
 917 |                   node.className = className;
 918 |                 }
 919 | 
 920 |                 if (
 921 |                   element.childNodes.length === 1 &&
 922 |                   element.childNodes[0].nodeType === 3
 923 |                 ) {
 924 |                   const text = element.textContent?.trim() || "";
 925 |                   if (text) {
 926 |                     // @ts-ignore
 927 |                     node.text =
 928 |                       text.length > 50 ? text.slice(0, 50) + "..." : text;
 929 |                   }
 930 |                 }
 931 | 
 932 |                 if (depth + 1 < maxDepth) {
 933 |                   for (let i = 0; i < element.children.length; i++) {
 934 |                     const child = extractVisibleStructure(
 935 |                       element.children[i],
 936 |                       depth + 1,
 937 |                     );
 938 |                     if (child) {
 939 |                       // @ts-ignore
 940 |                       node.children.push(child);
 941 |                     }
 942 |                   }
 943 |                 }
 944 | 
 945 |                 return node;
 946 |               };
 947 | 
 948 |               return extractVisibleStructure(document.body);
 949 |             },
 950 |             { allowedTags, allowedAttributes, maxDepth },
 951 |           ),
 952 |         };
 953 |       },
 954 |       name: "getVisibleStructure",
 955 |       description:
 956 |         "Returns a simplified hierarchical structure of visible DOM elements, focusing on roles, attributes, and basic content.",
 957 |       parse: (args: string) => {
 958 |         return z.object({}).parse(JSON.parse(args));
 959 |       },
 960 |       parameters: {
 961 |         type: "object",
 962 |         properties: {},
 963 |       },
 964 |     },
 965 |     locateElementsByRole: {
 966 |       function: async (args: {
 967 |         role:
 968 |           | "alert"
 969 |           | "alertdialog"
 970 |           | "application"
 971 |           | "article"
 972 |           | "banner"
 973 |           | "blockquote"
 974 |           | "button"
 975 |           | "caption"
 976 |           | "cell"
 977 |           | "checkbox"
 978 |           | "code"
 979 |           | "columnheader"
 980 |           | "combobox"
 981 |           | "complementary"
 982 |           | "contentinfo"
 983 |           | "definition"
 984 |           | "deletion"
 985 |           | "dialog"
 986 |           | "directory"
 987 |           | "document"
 988 |           | "emphasis"
 989 |           | "feed"
 990 |           | "figure"
 991 |           | "form"
 992 |           | "generic"
 993 |           | "grid"
 994 |           | "gridcell"
 995 |           | "group"
 996 |           | "heading"
 997 |           | "img"
 998 |           | "insertion"
 999 |           | "link"
1000 |           | "list"
1001 |           | "listbox"
1002 |           | "listitem"
1003 |           | "log"
1004 |           | "main"
1005 |           | "marquee"
1006 |           | "math"
1007 |           | "menu"
1008 |           | "menubar"
1009 |           | "menuitem"
1010 |           | "menuitemcheckbox"
1011 |           | "menuitemradio"
1012 |           | "meter"
1013 |           | "navigation"
1014 |           | "none"
1015 |           | "note"
1016 |           | "option"
1017 |           | "paragraph"
1018 |           | "presentation"
1019 |           | "progressbar"
1020 |           | "radio"
1021 |           | "radiogroup"
1022 |           | "region"
1023 |           | "row"
1024 |           | "rowgroup"
1025 |           | "rowheader"
1026 |           | "scrollbar"
1027 |           | "search"
1028 |           | "searchbox"
1029 |           | "separator"
1030 |           | "slider"
1031 |           | "spinbutton"
1032 |           | "status"
1033 |           | "strong"
1034 |           | "subscript"
1035 |           | "superscript"
1036 |           | "switch"
1037 |           | "tab"
1038 |           | "table"
1039 |           | "tablist"
1040 |           | "tabpanel"
1041 |           | "term"
1042 |           | "textbox"
1043 |           | "time"
1044 |           | "timer"
1045 |           | "toolbar"
1046 |           | "tooltip"
1047 |           | "tree"
1048 |           | "treegrid"
1049 |           | "treeitem";
1050 |         exact?: boolean;
1051 |       }) => {
1052 |         const locators = await page
1053 |           .getByRole(args.role, { exact: args.exact ?? false })
1054 |           .all();
1055 |         const elementIds: string[] = [];
1056 | 
1057 |         for (const locator of locators) {
1058 |           const elementId = randomUUID();
1059 |           await locator.evaluate(
1060 |             (node, id) => node.setAttribute("data-element-id", id),
1061 |             elementId,
1062 |           );
1063 |           elementIds.push(elementId);
1064 |         }
1065 | 
1066 |         return {
1067 |           elementIds,
1068 |           count: elementIds.length,
1069 |         };
1070 |       },
1071 |       name: "locateElementsByRole",
1072 |       description:
1073 |         "Finds elements by their ARIA role attribute and returns array of element IDs.",
1074 |       parse: (args: string) => {
1075 |         return z
1076 |           .object({
1077 |             role: z.string(),
1078 |             exact: z.boolean().optional(),
1079 |           })
1080 |           .parse(JSON.parse(args));
1081 |       },
1082 |       parameters: {
1083 |         type: "object",
1084 |         properties: {
1085 |           role: {
1086 |             type: "string",
1087 |             description:
1088 |               "ARIA role to search for, e.g. 'button', 'grid', 'row', etc.",
1089 |           },
1090 |           exact: {
1091 |             type: "boolean",
1092 |             description:
1093 |               "Whether to match the role exactly or allow partial matches.",
1094 |           },
1095 |         },
1096 |         required: ["role"],
1097 |       },
1098 |     },
1099 |     locateElementsWithText: {
1100 |       function: async (args: { text: string; exact?: boolean }) => {
1101 |         const allLocators = await page
1102 |           .getByText(args.text, { exact: args.exact ?? false })
1103 |           .all();
1104 | 
1105 |         const elementIds: string[] = [];
1106 | 
1107 |         for (const locator of allLocators) {
1108 |           if (await locator.isVisible()) {
1109 |             const elementId = randomUUID();
1110 |             await locator.evaluate(
1111 |               (node, id) => node.setAttribute("data-element-id", id),
1112 |               elementId,
1113 |             );
1114 |             elementIds.push(elementId);
1115 |           }
1116 |         }
1117 | 
1118 |         return {
1119 |           elementIds,
1120 |           count: elementIds.length,
1121 |         };
1122 |       },
1123 |       name: "locateElementsWithText",
1124 |       description:
1125 |         "Finds visible elements containing specified text and returns array of element IDs. Hidden elements are excluded.",
1126 |       parse: (args: string) => {
1127 |         return z
1128 |           .object({
1129 |             text: z.string(),
1130 |             exact: z.boolean().optional(),
1131 |           })
1132 |           .parse(JSON.parse(args));
1133 |       },
1134 |       parameters: {
1135 |         type: "object",
1136 |         properties: {
1137 |           text: {
1138 |             type: "string",
1139 |             description: "Text to search for within elements.",
1140 |           },
1141 |           exact: {
1142 |             type: "boolean",
1143 |             description:
1144 |               "Whether to match the text exactly or allow partial matches.",
1145 |           },
1146 |         },
1147 |         required: ["text"],
1148 |       },
1149 |     },
1150 |     waitForContentToLoad: {
1151 |       function: async (args: {
1152 |         selector: string;
1153 |         textMarker?: string;
1154 |         timeout?: number;
1155 |       }) => {
1156 |         try {
1157 |           if (args.textMarker) {
1158 |             await page.waitForSelector(
1159 |               `${args.selector}:has-text("${args.textMarker}")`,
1160 |               {
1161 |                 timeout: args.timeout || 30000,
1162 |                 state: "visible",
1163 |               },
1164 |             );
1165 |           } else {
1166 |             await page.waitForSelector(args.selector, {
1167 |               timeout: args.timeout || 30000,
1168 |               state: "visible",
1169 |             });
1170 |           }
1171 |           return { success: true };
1172 |         } catch (error) {
1173 |           return {
1174 |             success: false,
1175 |             error: `Timeout waiting for content to load: ${error.message}`,
1176 |           };
1177 |         }
1178 |       },
1179 |       name: "waitForContentToLoad",
1180 |       description:
1181 |         "Waits for dynamic content to load based on selector and optional text marker.",
1182 |       parse: (args: string) => {
1183 |         return z
1184 |           .object({
1185 |             selector: z.string(),
1186 |             textMarker: z.string().optional(),
1187 |             timeout: z.number().optional(),
1188 |           })
1189 |           .parse(JSON.parse(args));
1190 |       },
1191 |       parameters: {
1192 |         type: "object",
1193 |         properties: {
1194 |           selector: {
1195 |             type: "string",
1196 |             description: "CSS selector to wait for.",
1197 |           },
1198 |           textMarker: {
1199 |             type: "string",
1200 |             description:
1201 |               "Optional text content to wait for within the selector.",
1202 |           },
1203 |           timeout: {
1204 |             type: "number",
1205 |             description:
1206 |               "Maximum time to wait in milliseconds. Default is 30000 (30 seconds).",
1207 |           },
1208 |         },
1209 |         required: ["selector"],
1210 |       },
1211 |     },
1212 |     extractVisibleText: {
1213 |       function: async (args: { elementId?: string; selector?: string }) => {
1214 |         let result;
1215 | 
1216 |         if (args.elementId) {
1217 |           result = await getLocator(args.elementId).evaluate(
1218 |             (node: Element) => {
1219 |               const getVisibleText = (element: Element | Node): string => {
1220 |                 if (element.nodeType === 3) {
1221 |                   return element.textContent?.trim() || "";
1222 |                 }
1223 | 
1224 |                 if (element instanceof Element) {
1225 |                   const style = window.getComputedStyle(element);
1226 |                   if (
1227 |                     style.display === "none" ||
1228 |                     style.visibility === "hidden" ||
1229 |                     style.opacity === "0"
1230 |                   ) {
1231 |                     return "";
1232 |                   }
1233 | 
1234 |                   let text = "";
1235 |                   Array.from(element.childNodes).forEach((child) => {
1236 |                     text += getVisibleText(child);
1237 |                   });
1238 | 
1239 |                   return text;
1240 |                 }
1241 | 
1242 |                 return "";
1243 |               };
1244 | 
1245 |               return getVisibleText(node);
1246 |             },
1247 |           );
1248 |         } else if (args.selector) {
1249 |           result = await page.evaluate((selector: string) => {
1250 |             const elements = document.querySelectorAll(selector);
1251 |             let allText = "";
1252 | 
1253 |             elements.forEach((element) => {
1254 |               const style = window.getComputedStyle(element);
1255 |               if (
1256 |                 style.display !== "none" &&
1257 |                 style.visibility !== "hidden" &&
1258 |                 style.opacity !== "0"
1259 |               ) {
1260 |                 allText += (element.textContent?.trim() || "") + " ";
1261 |               }
1262 |             });
1263 | 
1264 |             return allText.trim();
1265 |           }, args.selector);
1266 |         } else {
1267 |           throw new Error("Either elementId or selector must be provided");
1268 |         }
1269 | 
1270 |         return { text: result };
1271 |       },
1272 |       name: "extractVisibleText",
1273 |       description:
1274 |         "Extracts only visible text from elements, ignoring hidden content.",
1275 |       parse: (args: string) => {
1276 |         return z
1277 |           .object({
1278 |             elementId: z.string().optional(),
1279 |             selector: z.string().optional(),
1280 |           })
1281 |           .refine(
1282 |             (data) =>
1283 |               data.elementId !== undefined || data.selector !== undefined,
1284 |             {
1285 |               message: "Either elementId or selector must be provided",
1286 |             },
1287 |           )
1288 |           .parse(JSON.parse(args));
1289 |       },
1290 |       parameters: {
1291 |         type: "object",
1292 |         properties: {
1293 |           elementId: {
1294 |             type: "string",
1295 |             description: "ID of the element to extract text from.",
1296 |           },
1297 |           selector: {
1298 |             type: "string",
1299 |             description: "CSS selector to locate elements for text extraction.",
1300 |           },
1301 |         },
1302 |       },
1303 |     },
1304 |     // Tool: scrolls the element identified by `elementId` into view (block: "center"), then pauses briefly.
1305 |     scrollIntoElementView: {
1306 |       function: async (args: { elementId: string; behavior?: string }) => {
1307 |         const target = getLocator(args.elementId);
1308 |         // `args.behavior` is handed to evaluate and arrives as the callback's second parameter.
1309 |         await target.evaluate(
1310 |           (element: Element, requested: string | undefined) => {
1311 |             const mode = (requested as "auto" | "smooth") || "smooth";
1312 |             element.scrollIntoView({ behavior: mode, block: "center" });
1313 |           },
1314 |           args.behavior,
1315 |         );
1316 |         // Fixed 500 ms wait before reporting success.
1317 |         await page.waitForTimeout(500);
1318 |         return { success: true };
1319 |       },
1320 |       name: "scrollIntoElementView",
1321 |       description:
1322 |         "Scrolls to bring an element into view, useful for loading content dynamically as user scrolls.",
1323 |       parse: (args: string) => {
1324 |         // Decode the JSON argument string, then validate it against the schema.
1325 |         const schema = z.object({
1326 |           elementId: z.string(),
1327 |           behavior: z.enum(["auto", "smooth"]).optional(),
1328 |         });
1329 |         return schema.parse(JSON.parse(args));
1330 |       },
1331 |       parameters: {
1332 |         type: "object",
1333 |         properties: {
1334 |           elementId: {
1335 |             type: "string",
1336 |             description: "ID of the element to scroll into view.",
1337 |           },
1338 |           behavior: {
1339 |             type: "string",
1340 |             enum: ["auto", "smooth"],
1341 |             description:
1342 |               "Scrolling behavior: 'auto' for instant scrolling or 'smooth' for animated scrolling.",
1343 |           },
1344 |         },
1345 |         required: ["elementId"],
1346 |       },
1347 |     },
1348 |     // Tool: waits for the page's "networkidle" load state; failures are returned as { success: false, error }.
1349 |     waitForNetworkIdle: {
1350 |       function: async (args: { timeout?: number; idleTime?: number }) => {
1351 |         try {
1352 |           // `??` (not `||`) so an explicit 0 is forwarded instead of being replaced by the 30000 ms default.
1353 |           const timeout = args.timeout ?? 30000;
1354 |           await page.waitForLoadState("networkidle", { timeout });
1355 |           // Optional extra settle time after idle; skipped when idleTime is absent or 0.
1356 |           if (args.idleTime) {
1357 |             await page.waitForTimeout(args.idleTime);
1358 |           }
1359 |           return { success: true };
1360 |         } catch (error) {
1361 |           // The thrown value is not guaranteed to be an Error, so narrow before reading `.message`.
1362 |           const reason = error instanceof Error ? error.message : String(error);
1363 |           const message = `Timeout waiting for network idle: ${reason}`;
1364 |           return { success: false, error: message };
1365 |         }
1366 |       },
1367 |       name: "waitForNetworkIdle",
1368 |       description:
1369 |         "Waits for network activity to be minimal or stopped, useful for SPA applications.",
1370 |       parse: (args: string) => {
1371 |         return z
1372 |           .object({
1373 |             timeout: z.number().optional(),
1374 |             idleTime: z.number().optional(),
1375 |           })
1376 |           .parse(JSON.parse(args));
1377 |       },
1378 |       parameters: {
1379 |         type: "object",
1380 |         properties: {
1381 |           timeout: {
1382 |             type: "number",
1383 |             description:
1384 |               "Maximum time to wait in milliseconds. Default is 30000 (30 seconds).",
1385 |           },
1386 |           idleTime: {
1387 |             type: "number",
1388 |             description:
1389 |               "Additional wait time after network becomes idle, in milliseconds.",
1390 |           },
1391 |         },
1392 |       },
1393 |     },
1394 |   };
1395 | };
1396 |

--------------------------------------------------------------------------------