├── .env.example
├── .eslintignore
├── .eslintrc
├── .github
    ├── CODEOWNERS
    ├── ISSUE_TEMPLATE
    │   ├── bug_report.md
    │   └── feature_request.md
    ├── auto_assign.yml
    ├── dependabot.yml
    ├── stale.yml
    └── workflows
    │   ├── auto-assign.yml
    │   ├── build-zip.yml
    │   ├── greetings.yml
    │   └── test.yml
├── .gitignore
├── .husky
    ├── commit-msg
    └── pre-commit
├── .npmrc
├── .nvmrc
├── .prettierignore
├── .prettierrc
├── CONTRIBUTING.md
├── CONTRIBUTING_KNOWLEDGE.md
├── LICENSE
├── PULL_REQUEST_TEMPLATE.md
├── README.md
├── TROUBLESHOOTING.md
├── commitlint.config.js
├── jest.config.js
├── manifest.js
├── media
    └── web-annotation.png
├── package.json
├── package.lib.json
├── pnpm-lock.yaml
├── postcss.config.js
├── public
    └── icon-128.png
├── rollup.lib.config.js
├── src
    ├── assets
    │   ├── img
    │   │   └── logo.svg
    │   └── style
    │   │   └── theme.scss
    ├── common
    │   ├── App.tsx
    │   ├── AutosizeTextarea.tsx
    │   ├── CopyButton.tsx
    │   ├── CustomKnowledgeBase
    │   │   ├── DefaultKnowledge.tsx
    │   │   ├── DuplicateKnowledgeAlert.tsx
    │   │   ├── HostKnowledge.tsx
    │   │   ├── NewKnowledgeForm.tsx
    │   │   ├── NewKnowledgeJson.tsx
    │   │   ├── Notes.tsx
    │   │   └── index.tsx
    │   ├── RecommendedTasks.tsx
    │   ├── RunTaskButton.tsx
    │   ├── Settings.tsx
    │   ├── TaskHistory.tsx
    │   ├── TaskStatus.tsx
    │   ├── TaskUI.tsx
    │   ├── TokenCount.tsx
    │   ├── VoiceButton.tsx
    │   └── settings
    │   │   ├── AgentModeDropdown.tsx
    │   │   ├── ModelDropdown.tsx
    │   │   └── SetAPIKey.tsx
    ├── constants.ts
    ├── environment.d.ts
    ├── global.d.ts
    ├── helpers
    │   ├── aiSdkUtils.ts
    │   ├── browserUtils.ts
    │   ├── buildAnnotatedScreenshots.ts
    │   ├── chromeDebugger.ts
    │   ├── countTokens.ts
    │   ├── disableExtensions.ts
    │   ├── dom-agent
    │   │   ├── availableActions.ts
    │   │   ├── determineNextAction.ts
    │   │   └── parseResponse.ts
    │   ├── errorChecker.ts
    │   ├── index.ts
    │   ├── knowledge
    │   │   ├── db.json
    │   │   ├── index.ts
    │   │   └── redirects.json
    │   ├── rpc
    │   │   ├── domActions.ts
    │   │   ├── pageRPC.ts
    │   │   ├── performAction.ts
    │   │   ├── runtimeFunctionStrings.ts
    │   │   └── utils.ts
    │   ├── shrinkHTML
    │   │   ├── tagsSelfClose.ts
    │   │   ├── templatize.test.ts
    │   │   └── templatize.ts
    │   ├── simplifyDom.ts
    │   ├── utils.ts
    │   ├── vision-agent
    │   │   ├── determineNavigateAction.ts
    │   │   ├── determineNextAction.ts
    │   │   ├── parseResponse.ts
    │   │   └── tools.ts
    │   └── voiceControl.ts
    ├── pages
    │   ├── background
    │   │   └── index.ts
    │   ├── content
    │   │   ├── attachFile.ts
    │   │   ├── copyToClipboard.ts
    │   │   ├── domOperations.ts
    │   │   ├── drawLabels.ts
    │   │   ├── getAnnotatedDOM.ts
    │   │   ├── getViewportPercentage.ts
    │   │   ├── index.ts
    │   │   ├── injected.ts
    │   │   ├── mainWorld
    │   │   │   ├── index.ts
    │   │   │   └── mainWorld.ts
    │   │   ├── permission.ts
    │   │   ├── reverseMarkdown.ts
    │   │   ├── ripple.ts
    │   │   ├── style.global.scss
    │   │   └── style.scss
    │   ├── devtools
    │   │   ├── index.html
    │   │   └── index.ts
    │   ├── newtab
    │   │   ├── Newtab.css
    │   │   ├── Newtab.scss
    │   │   ├── Newtab.tsx
    │   │   ├── index.css
    │   │   ├── index.html
    │   │   └── index.tsx
    │   ├── options
    │   │   ├── Options.css
    │   │   ├── Options.tsx
    │   │   ├── index.css
    │   │   ├── index.html
    │   │   └── index.tsx
    │   ├── panel
    │   │   ├── Panel.css
    │   │   ├── Panel.tsx
    │   │   ├── index.css
    │   │   ├── index.html
    │   │   └── index.tsx
    │   ├── permission
    │   │   ├── index.html
    │   │   └── requestPermission.ts
    │   ├── popup
    │   │   ├── Popup.css
    │   │   ├── Popup.tsx
    │   │   ├── index.css
    │   │   ├── index.html
    │   │   └── index.tsx
    │   └── sidepanel
    │   │   ├── index.css
    │   │   ├── index.html
    │   │   └── index.tsx
    ├── shared
    │   ├── hoc
    │   │   ├── withErrorBoundary.tsx
    │   │   └── withSuspense.tsx
    │   ├── hooks
    │   │   └── useStorage.tsx
    │   ├── images
    │   │   └── mergeScreenshots.ts
    │   └── storages
    │   │   ├── base.ts
    │   │   └── exampleThemeStorage.ts
    ├── state
    │   ├── currentTask.ts
    │   ├── settings.ts
    │   ├── store.ts
    │   └── ui.ts
    └── vite-env.d.ts
├── tailwind.config.js
├── test-utils
    └── jest.setup.js
├── tsconfig.json
├── utils
    ├── log.ts
    ├── manifest-parser
    │   └── index.ts
    ├── plugins
    │   ├── add-hmr.ts
    │   ├── custom-dynamic-import.ts
    │   ├── inline-vite-preload-script.ts
    │   ├── make-manifest.ts
    │   └── watch-rebuild.ts
    └── reload
    │   ├── constant.ts
    │   ├── initReloadClient.ts
    │   ├── initReloadServer.ts
    │   ├── injections
    │       ├── script.ts
    │       └── view.ts
    │   ├── interpreter
    │       ├── index.ts
    │       └── types.ts
    │   ├── rollup.config.mjs
    │   └── utils.ts
└── vite.config.ts


/.env.example:
--------------------------------------------------------------------------------
1 | VITE_DEBUG_MODE=true
2 | 


--------------------------------------------------------------------------------
/.eslintignore:
--------------------------------------------------------------------------------
1 | dist
2 | node_modules
3 | 


--------------------------------------------------------------------------------
/.eslintrc:
--------------------------------------------------------------------------------
 1 | {
 2 |   "env": {
 3 |     "browser": true,
 4 |     "es6": true,
 5 |     "node": true
 6 |   },
 7 |   "extends": [
 8 |     "eslint:recommended",
 9 |     "plugin:react/recommended",
10 |     "plugin:@typescript-eslint/recommended",
11 |     "plugin:react-hooks/recommended",
12 |     "plugin:import/recommended",
13 |     "plugin:jsx-a11y/recommended",
14 |     "prettier"
15 |   ],
16 |   "parser": "@typescript-eslint/parser",
17 |   "parserOptions": {
18 |     "ecmaFeatures": {
19 |       "jsx": true
20 |     },
21 |     "ecmaVersion": "latest",
22 |     "sourceType": "module"
23 |   },
24 |   "plugins": [
25 |     "react",
26 |     "@typescript-eslint",
27 |     "react-hooks",
28 |     "import",
29 |     "jsx-a11y",
30 |     "prettier"
31 |   ],
32 |   "settings": {
33 |     "react": {
34 |       "version": "detect"
35 |     }
36 |   },
37 |   "rules": {
38 |     "prefer-promise-reject-errors": "error",
39 |     "no-throw-literal": "error",
40 |     "react/react-in-jsx-scope": "off",
41 |     "import/no-unresolved": "off"
42 |   },
43 |   "globals": {
44 |     "chrome": "readonly"
45 |   },
46 |   "ignorePatterns": ["watch.js", "dist/**"]
47 | }
48 | 


--------------------------------------------------------------------------------
/.github/CODEOWNERS:
--------------------------------------------------------------------------------
1 | * @mondaychen


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/bug_report.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Bug report
 3 | about: Create a report to help us improve
 4 | title: ''
 5 | labels: bug
 6 | assignees: Jonghakseo
 7 | 
 8 | ---
 9 | 
10 | **Describe the bug**
11 | A clear and concise description of what the bug is.
12 | 
13 | **To Reproduce**
14 | Steps to reproduce the behavior:
15 | 1. Go to '...'
16 | 2. Click on '....'
17 | 3. Scroll down to '....'
18 | 4. See error
19 | 
20 | **Expected behavior**
21 | A clear and concise description of what you expected to happen.
22 | 
23 | **Screenshots**
24 | If applicable, add screenshots to help explain your problem.
25 | 
26 | **Desktop (please complete the following information):**
27 |  - OS: [e.g. Mac, Windows, Linux]
28 |  - Browser [e.g. chrome, firefox]
29 |  - Node Version [e.g. 18.12.0]
30 | 
31 | **Additional context**
32 | Add any other context about the problem here.
33 | 


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/feature_request.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Feature request
 3 | about: Suggest an idea for this project
 4 | title: ''
 5 | labels: enhancement
 6 | assignees: Jonghakseo
 7 | 
 8 | ---
 9 | 
10 | **Is your feature request related to a problem? Please describe.**
11 | A clear and concise description of what the problem is. Ex. I'm always frustrated when [...]
12 | 
13 | **Describe the solution you'd like**
14 | A clear and concise description of what you want to happen.
15 | 
16 | **Describe alternatives you've considered**
17 | A clear and concise description of any alternative solutions or features you've considered.
18 | 
19 | **Additional context**
20 | Add any other context or screenshots about the feature request here.
21 | 


--------------------------------------------------------------------------------
/.github/auto_assign.yml:
--------------------------------------------------------------------------------
 1 | # Set to true to add reviewers to pull requests
 2 | addReviewers: true
 3 | 
 4 | # Set to true to add assignees to pull requests
 5 | addAssignees: author
 6 | 
 7 | # A list of reviewers to be added to pull requests (GitHub user name)
 8 | reviewers:
 9 |   - mondaychen
10 | 
11 | # A number of reviewers added to the pull request
12 | # Set 0 to add all the reviewers (default: 0)
13 | numberOfReviewers: 0
14 | 
15 | # A list of assignees, overrides reviewers if set
16 | # assignees:
17 | #   - assigneeA
18 | 
19 | # A number of assignees to add to the pull request
20 | # Set to 0 to add all of the assignees.
21 | # Uses numberOfReviewers if unset.
22 | # numberOfAssignees: 2
23 | 
24 | # A list of keywords; if a pull request includes any of them, the process of adding reviewers is skipped
25 | # skipKeywords:
26 | #   - wip
27 | 
28 | filterLabels:
29 |   exclude:
30 |     - dependencies
31 | 


--------------------------------------------------------------------------------
/.github/dependabot.yml:
--------------------------------------------------------------------------------
 1 | # To get started with Dependabot version updates, you'll need to specify which
 2 | # package ecosystems to update and where the package manifests are located.
 3 | # Please see the documentation for all configuration options:
 4 | # https://docs.github.com/github/administering-a-repository/configuration-options-for-dependency-updates
 5 | 
 6 | version: 2
 7 | updates:
 8 |   - package-ecosystem: "npm" # See documentation for possible values
 9 |     directory: "/" # Location of package manifests
10 |     schedule:
11 |       interval: "weekly"
12 | 


--------------------------------------------------------------------------------
/.github/stale.yml:
--------------------------------------------------------------------------------
 1 | # Number of days of inactivity before an Issue or Pull Request becomes stale
 2 | daysUntilStale: 90
 3 | # Number of days of inactivity before a stale Issue or Pull Request is closed
 4 | daysUntilClose: 30
 5 | # Issues or Pull Requests with these labels will never be considered stale. Set to `[]` to disable
 6 | exemptLabels:
 7 |   - pinned
 8 |   - security
 9 | # Label to use when marking as stale
10 | staleLabel: stale
11 | # Comment to post when marking as stale. Set to `false` to disable
12 | markComment: >
13 |   This issue has been automatically marked as stale because it has not had
14 |   recent activity. It will be closed if no further activity occurs. Thank you
15 |   for your contributions.
16 | # Comment to post when removing the stale label. Set to `false` to disable
17 | unmarkComment: false
18 | # Comment to post when closing a stale Issue or Pull Request. Set to `false` to disable
19 | closeComment: ture
20 | # Limit to only `issues` or `pulls`
21 | only: issues
22 | 


--------------------------------------------------------------------------------
/.github/workflows/auto-assign.yml:
--------------------------------------------------------------------------------
 1 | name: 'Auto Assign'
 2 | on:
 3 |   pull_request:
 4 |     types: [opened, ready_for_review]
 5 | 
 6 | jobs:
 7 |   add-reviews:
 8 |     runs-on: ubuntu-latest
 9 |     steps:
10 |       - uses: kentaro-m/auto-assign-action@v1.2.5
11 |         with:
12 |           configuration-path: '.github/auto_assign.yml'
13 | 


--------------------------------------------------------------------------------
/.github/workflows/build-zip.yml:
--------------------------------------------------------------------------------
 1 | name: Build And Upload Extension Zip Via Artifact
 2 | 
 3 | on:
 4 |   push:
 5 |     branches: [ main ]
 6 |   pull_request:
 7 | 
 8 | jobs:
 9 |   build:
10 | 
11 |     runs-on: ubuntu-latest
12 | 
13 |     steps:
14 |       - uses: actions/checkout@v3
15 | 
16 |       - name: Setup Node.js
17 |         uses: actions/setup-node@v3
18 |         with:
19 |           node-version-file: ".nvmrc"
20 | 
21 |       - uses: actions/cache@v3
22 |         with:
23 |           path: node_modules
24 |           key: ${{ runner.OS }}-build-${{ hashFiles('**/package-lock.json') }}
25 | 
26 |       - uses: pnpm/action-setup@v2
27 | 
28 |       - run: pnpm install --frozen-lockfile
29 | 
30 |       - run: pnpm build
31 | 
32 |       - uses: actions/upload-artifact@v3
33 |         with:
34 |           name: fuji-extension
35 |           path: dist/*
36 | 


--------------------------------------------------------------------------------
/.github/workflows/greetings.yml:
--------------------------------------------------------------------------------
 1 | name: Greetings
 2 | 
 3 | on: [pull_request_target, issues]
 4 | 
 5 | jobs:
 6 |   greeting:
 7 |     runs-on: ubuntu-latest
 8 |     permissions:
 9 |       issues: write
10 |       pull-requests: write
11 |     steps:
12 |     - uses: actions/first-interaction@v1
13 |       with:
14 |         repo-token: ${{ secrets.GITHUB_TOKEN }}
15 |         issue-message: 'Thank you for your contribution. We will check and reply to you as soon as possible.'
16 |         pr-message: 'Thank you for your contribution. We will check and reply to you as soon as possible.'
17 | 


--------------------------------------------------------------------------------
/.github/workflows/test.yml:
--------------------------------------------------------------------------------
 1 | name: Test
 2 | 
 3 | on:
 4 |   push:
 5 |     branches: [ main ]
 6 |   pull_request:
 7 | 
 8 | jobs:
 9 |   test:
10 |     runs-on: ubuntu-latest
11 | 
12 |     steps:
13 |       - uses: actions/checkout@v3
14 | 
15 |       - name: Setup Node.js
16 |         uses: actions/setup-node@v3
17 |         with:
18 |           node-version-file: ".nvmrc"
19 | 
20 |       - uses: actions/cache@v3
21 |         with:
22 |           path: node_modules
23 |           key: ${{ runner.OS }}-build-${{ hashFiles('**/package-lock.json') }}
24 | 
25 |       - uses: pnpm/action-setup@v2
26 | 
27 |       - run: pnpm install --frozen-lockfile
28 | 
29 |       - run: pnpm test
30 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
 1 | # dependencies
 2 | /node_modules
 3 | 
 4 | # testing
 5 | /coverage
 6 | 
 7 | # build
 8 | /dist
 9 | /dist-lib
10 | 
11 | # etc
12 | .DS_Store
13 | .env.local
14 | .env
15 | .idea
16 | 
17 | # compiled
18 | utils/reload/*.js
19 | utils/reload/injections/*.js
20 | public/manifest.json
21 | 


--------------------------------------------------------------------------------
/.husky/commit-msg:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env sh
2 | . "$(dirname -- "$0")/_/husky.sh"
3 | 
4 | npm run commitlint ${1}
5 | 


--------------------------------------------------------------------------------
/.husky/pre-commit:
--------------------------------------------------------------------------------
1 | #!/usr/bin/env sh
2 | . "$(dirname -- "$0")/_/husky.sh"
3 | 
4 | npx lint-staged
5 | 


--------------------------------------------------------------------------------
/.npmrc:
--------------------------------------------------------------------------------
1 | public-hoist-pattern[]=@testing-library/dom
2 | 


--------------------------------------------------------------------------------
/.nvmrc:
--------------------------------------------------------------------------------
1 | 22.11.0
2 | 


--------------------------------------------------------------------------------
/.prettierignore:
--------------------------------------------------------------------------------
 1 | dist
 2 | node_modules
 3 | .gitignore
 4 | .github
 5 | .eslintignore
 6 | .husky
 7 | .nvmrc
 8 | .prettierignore
 9 | LICENSE
10 | *.md
11 | pnpm-lock.yaml


--------------------------------------------------------------------------------
/.prettierrc:
--------------------------------------------------------------------------------
1 | {
2 |   "semi": true,
3 |   "printWidth": 80
4 | }
5 | 


--------------------------------------------------------------------------------
/CONTRIBUTING.md:
--------------------------------------------------------------------------------
 1 | # Contributing to Fuji-Web
 2 | 
 3 | Thank you for your interest in contributing to Fuji-Web! Fuji-Web is a tool that simplifies web interactions through the innovative use of multi-modal Large Language Models, offering users a more intuitive and efficient online experience. We welcome contributions from the community to help make Fuji-Web even better.
 4 | 
 5 | ## How to Contribute
 6 | 
 7 | There are many ways to contribute to Fuji-Web, from writing code to improving documentation, reporting bugs, and suggesting enhancements. Here's how you can get started:
 8 | 
 9 | ### Spread the Word
10 | If you love Fuji-Web, you can make a big difference by telling others about it. Write a blog post, talk about it on social media, or share your experience with friends and colleagues. Every bit helps in growing our community and bringing new contributors on board.
11 | 
12 | ### Reporting Bugs
13 | 
14 | Before reporting a new bug, please ensure that the issue has not already been reported. You can do this by searching through the existing issues in our GitHub repository. 
15 | 
16 | If you encounter a bug while using Fuji-Web and it has not been reported yet, please report it by creating a new issue. Be sure to include:
17 | 
18 | - A clear and descriptive title
19 | - A detailed description of the bug, including steps to reproduce it
20 | - Any relevant screenshots or error messages
21 | - Your Fuji-Web version and browser details
22 | 
23 | ### Suggesting Enhancements
24 | 
25 | We're always looking for ways to improve Fuji-Web. If you have an idea for a new feature or an enhancement to an existing one, please submit it as an issue, using a clear and concise title and description. Explain why this enhancement would be useful, and if possible, include examples of how it could be implemented.
26 | 
27 | ### Contributing Code
28 | 
29 | Confirm alignment on the proposed work. For small fixes or minor enhancements, make sure there is an open and accepted issue. For larger contributions, a design or plan should have been reviewed and agreed upon by the maintainers.
30 | 
31 | Before submitting your first code contribution, please make sure to:
32 | 
33 | 1. Clone the repository.
34 | 2. Follow the setup instructions in the README.md to get your development environment running.
35 | 3. Make your changes in a new git branch and test your changes locally.
36 | 4. Commit your changes using a clear and descriptive commit message.
37 | 5. Push your branch to GitHub and open a pull request against the `main` branch. In your pull request, include any relevant issue numbers and a description of the changes you've made.
38 | 
39 | ### Pull Request Guidelines
40 | 
41 | - Ensure that your code follows the project's coding conventions and is properly documented.
42 | - Include screenshots or animated GIFs in your pull request whenever possible, especially for UI-related changes.
43 | - Follow the [Pull Request Template](https://github.com/normal-computing/fuji-web/blob/main/PULL_REQUEST_TEMPLATE.md) provided in the repository for the description of your pull request.
44 | 
45 | ### Code Review Process
46 | 
47 | After you submit a pull request, the project maintainers will review your proposed changes. This process helps to ensure the quality and consistency of the Fuji-Web codebase. The review may require some back-and-forth communication, so please be patient. We appreciate your contributions and will do our best to provide feedback and guidance as quickly as possible.
48 | 
49 | ## Community and Conduct
50 | 
51 | We are committed to providing a welcoming and inspiring community for all. We encourage all contributors to foster an open and welcoming environment, and to be respectful of differing viewpoints and experiences.
52 | 
53 | ## Acknowledgements
54 | 
55 | Your contributions help make Fuji-Web a better tool for everyone. We look forward to your ideas, feedback, and contributions. Thank you for being part of the Fuji-Web community! Happy contributing!
56 | 


--------------------------------------------------------------------------------
/CONTRIBUTING_KNOWLEDGE.md:
--------------------------------------------------------------------------------
 1 | # Contributing to Prior Knowledge Augmentation
 2 | 
 3 | Fuji-Web's Prior Knowledge Augmentation system is designed to enhance the tool's web navigation and task execution capabilities by leveraging a shared knowledge base. Contributions to this system help make Fuji-Web smarter and more capable.
 4 | 
 5 | ## What Kind of Knowledge Are We Looking For?
 6 | 
 7 | We seek knowledge that:
 8 | - Enhances the understanding of specific web pages or actions, making task execution more reliable.
 9 | - Includes insights into website layouts, common patterns, and user interfaces that are not immediately obvious.
10 | - Provides rules or annotations that help the AI better interpret the purpose of elements on a page.
11 | 
12 | For example, if a website has two buttons with the same name but different functionalities, it's crucial to describe in notes how to distinguish between them.
13 | 
14 | ## How to Add and Test New Knowledge
15 | 
16 | We offer two convenient ways to add and test new knowledge in real-time:
17 | - Via Form: Within the Fuji-Web UI settings, navigate to the "Custom Knowledge Base" and select "Add Host Knowledge with Form" to input new knowledge using a user-friendly form.
18 | - Via JSON: If you prefer to work directly with JSON, choose "Add Host Knowledge with JSON" to enter your custom knowledge.
19 | 
20 | You can test the new knowledge by running several tasks on the relevant web pages to ensure Fuji-Web behaves as expected.
21 | 
22 | Once you've tested various knowledge inputs and are satisfied with the new knowledge's performance, you can then copy that knowledge into the db.json file.
23 | 
24 | 1. Locate the `db.json` file in the `src/helpers/knowledge` directory of the Fuji-Web repository.
25 | 2. Add your knowledge in the JSON format, following the existing structure. `annotationRules` is optional.
26 |    ```json
27 |    {
28 |      "example.com": {
29 |        "rules": [
30 |          {
31 |            "regexes": ["regular expression to match pathname (not host name)"],
32 |            "knowledge": {
33 |              "notes": ["Your insights or notes about this page or action"],
34 |              "annotationRules": [
35 |                {
36 |                  "selector": "CSS selector",
37 |                  "allowInvisible": true,
38 |                  "allowCovered": true,
39 |                  "allowAriaHidden": true
40 |                }
41 |              ]
42 |            }
43 |          }
44 |        ]
45 |      }
46 |    }
47 |    ```
48 | 3. Please ensure your contributions are clear and concise, with `regexes` and `selector` accurately defined.
49 | 
50 | ## Submitting Your Contribution
51 | 
52 | Please check out the [Contribution Guide](CONTRIBUTING.md). Share your testing process and results in your pull request to help reviewers understand the impact of your contribution. Specifically, describe how the new knowledge helps Fuji-Web achieve something it previously could not perform correctly.
53 | 


--------------------------------------------------------------------------------
/PULL_REQUEST_TEMPLATE.md:
--------------------------------------------------------------------------------
 1 | ## Description
 2 | 
 3 | Please include a summary of the changes you have made. Describe any new features, bug fixes, or improvements you have introduced. If your changes address an open issue, please include a reference to it (e.g., `Fixes #123`).
 4 | 
 5 | ## Type of Change
 6 | 
 7 | Please delete options that are not relevant.
 8 | 
 9 | - [ ] New feature (non-breaking change which adds functionality)
10 | - [ ] Bug fix (non-breaking change which fixes an issue)
11 | - [ ] Documentation update
12 | - [ ] Code style update (formatting, renaming)
13 | - [ ] Refactoring (no functional changes, no API changes)
14 | - [ ] Build-related changes
15 | - [ ] Other (please describe):
16 | 
17 | ## How Has This Been Tested?
18 | 
19 | Please describe the tests that you ran to verify your changes. Provide instructions so we can reproduce the testing. Please also list any relevant details for your test configuration.
20 | 
21 | - [ ] Test A
22 | - [ ] Test B
23 | 
24 | ## Checklist:
25 | 
26 | Before submitting your pull request, please review the following checklist:
27 | 
28 | - [ ] I have proved my fix is effective or that my feature works.
29 | - [ ] I have performed a self-review of my own code.
30 | - [ ] I have commented on my code, particularly in hard-to-understand areas.
31 | - [ ] My changes generate no new warnings.
32 | 
33 | ## Screenshots (if applicable)
34 | 
35 | If your changes are visual and it helps to illustrate them, please include screenshots or GIFs here.
36 | 
37 | ## Additional Context
38 | 
39 | Provide any additional information about your pull request here.


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | <img src="public/icon-128.png" alt="Fuji-web Logo" width="100"/>
 2 | 
 3 | # Fuji-Web: AI-based Full Browser Automation 🗻
 4 | 
 5 | Fuji-Web is an intelligent AI partner that understands the user’s intent, navigates websites autonomously, and executes tasks on the user’s behalf while explaining each action step.
 6 | 
 7 | ### Demo
 8 | https://github.com/normal-computing/fuji-web/assets/1001890/88a2fa12-31d9-4856-be67-27dcf9f1e634
 9 | 
10 | ## How does it work?
11 | 
12 | **Please read [our blog post](https://blog.normalcomputing.ai/posts/2024-05-22-introducing-fuji-web/fuji-web.html) for a demo video, benchmarks and deep-dive technical overview!**
13 | 
14 | ## Installing and Running
15 | 
16 | ### Download and Install the extension in your browser
17 | 
18 | 1. Go to the [releases page](https://github.com/normal-computing/fuji-web/releases), find the latest version of the extension and download "fuji-extension.zip".
19 | 2. Unzip the file.
20 | 3. Load your extension on Chrome by doing the following:
21 |    1. Navigate to `chrome://extensions/`
22 |    2. Toggle `Developer mode`
23 |    3. Click on `Load unpacked extension`
24 |    4. Select the unzipped folder
25 | 
26 | ### Use the extension
27 | 
28 | *Please note that you may need to refresh the page for the extension to work.*
29 | 
30 | 1. Find the Fuji icon in the top right corner of your browser and click on it to open the sidepanel.
31 | 2. Create or access an existing [OpenAI API Key](https://platform.openai.com/account/api-keys) or [Anthropic API key](https://console.anthropic.com/settings/keys) and paste it in the provided box. This key will be stored in your browser, and will not be uploaded to a third party.
32 | 3. Finally, navigate to the webpage you want Fuji-Web to work on and type in the task you want it to perform.
33 | 
34 | _Note: all prompts (text and image) are sent directly to the API of your selection. Fuji-Web does not attempt to collect any information from you._
35 | 
36 | ### Build the extension
37 | 
38 | If you want to build the extension from source, follow these instructions:
39 | 
40 | 1. Ensure you have [Node.js](https://nodejs.org/). The development was done on Node v20 but it should work with some lower versions.
41 | 2. Clone this repository
42 | 3. Install `pnpm` globally: `npm install -g pnpm`
43 | 4. Run `pnpm install` 
44 | 5. Run `pnpm dev` to start the development server, or `pnpm build` to build the extension.
45 | 
46 | When loading the extension, you will need to load the `dist` folder created by the build process.
47 | 
48 | ## Roadmap
49 | 
50 | - Expose API for easy integration with browser automation frameworks (e.g. Puppeteer, Playwright, Selenium)
51 | - Add support for more complex & cross-tab workflows
52 | - Add support for more browsing behaviors (select from dropdown, extract content from entire page etc.)
53 | - Add support for saving workflows
54 | - Add support for sharing workflows & instructions with others
55 | - Create a Wikipedia-like knowledge base where users can work together to create knowledge that can improve Fuji-Web's performance
56 | 
57 | ## Troubleshooting
58 | 
59 | Check out our [Troubleshooting Guide](TROUBLESHOOTING.md) for help with common problems.
60 | 
61 | ## Contributing
62 | 
63 | Interested in contributing to Fuji-Web? We'd love your help! Check out our [Contribution Guide](CONTRIBUTING.md) for guidelines on how to contribute, report bugs, suggest enhancements, and more. 
64 | 
65 | We have also set up a dedicated channel for Fuji-Web feedback on Discord at https://discord.gg/yfMjZ8udb5.
66 | 
67 | ## Credits
68 | 
69 | - Fuji-Web's image annotation method was inspired by Microsoft's [UFO paper](https://arxiv.org/abs/2402.07939).
70 | - Fuji as a tool that lives in the browser sidepanel was inspired by [TaxyAI's browser extension](https://github.com/TaxyAI/browser-extension). We also used some of its UI code.
71 | - The Chrome extension set-up leveraged an awesome boilerplate project [Jonghakseo/chrome-extension-boilerplate-react-vite](https://github.com/Jonghakseo/chrome-extension-boilerplate-react-vite).
72 | - The Fuji logo is from [Toss Face](https://emojipedia.org/toss-face) Emoji design set.
73 | 


--------------------------------------------------------------------------------
/TROUBLESHOOTING.md:
--------------------------------------------------------------------------------
 1 | # Troubleshooting Guide for Fuji-Web
 2 | 
 3 | This guide aims to help you diagnose and resolve common problems you might encounter. If you're still facing difficulties after following these steps, please reach out to us through our [GitHub Issues](https://github.com/normal-computing/fuji-web/issues).
 4 | 
 5 | 
 6 | ## Common Issues and Solutions
 7 | 
 8 | ### Extension Not Loading
 9 | 
10 | **Symptom**: The Fuji-Web extension doesn't appear in your browser or won't load.
11 | 
12 | **Solutions**:
13 | 1. Ensure your browser is compatible with Fuji-Web. Currently, Fuji-Web supports Chrome.
14 | 2. Verify that `Developer mode` is enabled in `chrome://extensions/`
15 | 3. (Only when you are building it from source) Make sure you've loaded the extension from the `dist` folder.
16 | 4. Restart your browser as this can resolve many loading issues.
17 | 
18 | ### API Key Problems
19 | 
20 | **Symptom**: Issues related to the OpenAI API key, such as authentication errors or features not working because of a key problem. For example: "404 The model `gpt-4-vision-preview` does not exist or you do not have access to it."
21 | 
22 | **Solutions**:
23 | 1. Make sure you entered a valid OpenAI API key. Note that keys can expire, so verify if yours is still active.
24 | 2. Ensure that your OpenAI API key has the necessary permissions. Visit https://platform.openai.com/playground/chat to check your permissions. Lack of credits can also restrict access to certain models.
25 | 
26 | ### DOM Action Problems
27 | 
28 | **Symptom**: Fuji-Web did not perform DOM actions properly.
29 | 
30 | **Solutions**:
31 | 1. Currently, Fuji-Web does not support running in the background. If you open a new tab or navigate away from the website that Fuji-Web is working on, some actions may fail. Please stay on the website where you execute Fuji-Web. 
32 | 
33 | ### Custom Knowledge Base Problems
34 | 
35 | **Symptom**: After adding custom knowledge, Fuji-Web crashed or did not perform according to the new knowledge about the active tab.
36 | 
37 | **Solutions**:
38 | 1. Currently, Fuji-Web only supports basic entry validation for custom knowledge. Make sure you entered the correct host name and correct regular expressions if using a custom URL Matching Pattern. 
39 | 
40 | ### Voice Mode Problems
41 | 
42 | **Symptom**: Fuji-Web did not capture speech.
43 | 
44 | **Solutions**:
45 | 1. Check if Fuji-Web has microphone access in the browser. When you turn on the voice mode in settings, the microphone access dialog should pop up in the browser; please select "allow".
46 | 2. If the dialog didn't pop up, right-click the Fuji-Web icon in the extensions group and select "View Web Permissions". Then select "Allow" for Microphone.
47 | 
48 | 
49 | ## Reporting New Issues
50 | 
51 | If you encounter a problem not covered in this guide, please help us by reporting it. Provide as much detail as possible, including steps to reproduce the issue, browser version, and any error messages you receive. Your reports are invaluable in helping us improve Fuji-Web.


--------------------------------------------------------------------------------
/commitlint.config.js:
--------------------------------------------------------------------------------
// Commitlint configuration: inherit the rule set from @commitlint/config-conventional.
export default { extends: ["@commitlint/config-conventional"] };
2 | 


--------------------------------------------------------------------------------
/manifest.js:
--------------------------------------------------------------------------------
 1 | import packageJson from "./package.json" with { type: "json" };
 2 | 
/**
 * Extension manifest object (Manifest V3), exported as this module's default
 * export. `version` and `description` are read from package.json so they are
 * not duplicated here.
 *
 * After changing, please reload the extension at `chrome://extensions`
 * @type {chrome.runtime.ManifestV3}
 */
const manifest = {
  manifest_version: 3,
  name: "Fuji",
  version: packageJson.version,
  description: packageJson.description,
  // NOTE(review): presumably "debugger" and "management" back
  // helpers/chromeDebugger.ts and helpers/disableExtensions.ts — confirm.
  permissions: [
    "storage",
    "sidePanel",
    "tabs",
    "activeTab",
    "scripting",
    "clipboardWrite",
    "debugger",
    "management",
  ],
  host_permissions: ["<all_urls>"],
  side_panel: {
    default_path: "src/pages/sidepanel/index.html",
  },
  options_page: "src/pages/options/index.html",
  background: {
    service_worker: "src/pages/background/index.js",
    type: "module",
  },
  action: {
    // No popup is registered; the toolbar button only carries a title and icon.
    // default_popup: 'src/pages/popup/index.html',
    default_title: "Click to open side panel",
    default_icon: "icon-128.png",
  },
  icons: {
    128: "icon-128.png",
  },
  content_scripts: [
    {
      // NOTE(review): "<all_urls>" appears to subsume the two explicit scheme
      // patterns listed before it — confirm before trimming the list.
      matches: ["http://*/*", "https://*/*", "<all_urls>"],
      js: ["src/pages/content/index.js"],
      css: ["assets/css/contentStyleGlobal.css"],
      run_at: "document_start", // load the js as soon as possible since it does not rely on the DOM
    },
  ],
  // devtools_page: "src/pages/devtools/index.html",
  web_accessible_resources: [
    {
      resources: [
        "assets/js/*.js",
        "assets/css/*.css",
        "assets/fonts/*",
        "icon-128.png",
        "src/pages/permission/index.html",
        // NOTE(review): this entry names a .ts source file; confirm the build
        // actually emits a file at this path.
        "src/pages/permission/requestPermissions.ts",
      ],
      matches: ["*://*/*"],
    },
  ],
};
62 | 
63 | export default manifest;
64 | 


--------------------------------------------------------------------------------
/media/web-annotation.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/normal-computing/fuji-web/1aec509e4c437ca7764a5b4a56deaeba18691729/media/web-annotation.png


--------------------------------------------------------------------------------
/package.json:
--------------------------------------------------------------------------------
  1 | {
  2 |   "name": "fuji-web",
  3 |   "version": "2.2.0",
  4 |   "description": "A tool that redefines web interaction, making complex online tasks as simple as uttering a single command.",
  5 |   "repository": {
  6 |     "type": "git",
  7 |     "url": "https://github.com/normal-computing/fuji-web"
  8 |   },
  9 |   "scripts": {
 10 |     "build": "tsc --noEmit && vite build",
 11 |     "build:lib": "rollup --config rollup.lib.config.js && cp package.lib.json dist-lib/package.json",
 12 |     "build:firefox": "tsc --noEmit && cross-env __FIREFOX__=true vite build",
 13 |     "build:watch": "cross-env __DEV__=true vite build -w --mode development",
 14 |     "build:firefox:watch": "cross-env __DEV__=true __FIREFOX__=true vite build -w --mode development",
 15 |     "build:hmr": "rollup --config utils/reload/rollup.config.mjs",
 16 |     "wss": "node utils/reload/initReloadServer.js",
 17 |     "dev": "pnpm build:hmr && (run-p wss build:watch)",
 18 |     "dev:firefox": "pnpm build:hmr && (run-p wss build:firefox:watch)",
 19 |     "test": "exit 0",
 20 |     "commitlint": "commitlint --edit",
 21 |     "lint": "eslint src --ext .ts",
 22 |     "lint:fix": "pnpm lint --fix",
 23 |     "prettier": "prettier . --write",
 24 |     "prepare": "husky install"
 25 |   },
 26 |   "type": "module",
 27 |   "dependencies": {
 28 |     "@anthropic-ai/sdk": "^0.19.1",
 29 |     "@chakra-ui/icons": "^2.1.1",
 30 |     "@chakra-ui/react": "^2.8.2",
 31 |     "@emotion/react": "^11.11.4",
 32 |     "@emotion/styled": "^11.11.5",
 33 |     "@google/generative-ai": "^0.19.0",
 34 |     "accname": "^1.1.0",
 35 |     "construct-style-sheets-polyfill": "3.1.0",
 36 |     "formik": "^2.4.5",
 37 |     "immer": "^10.0.3",
 38 |     "lodash": "^4.17.21",
 39 |     "openai": "^4.60.0",
 40 |     "react": "18.2.0",
 41 |     "react-dom": "18.2.0",
 42 |     "react-icons": "^5.3.0",
 43 |     "react-syntax-highlighter": "^15.5.0",
 44 |     "react-textarea-autosize": "^8.4.1",
 45 |     "react-use": "^17.4.0",
 46 |     "tailwindcss": "^3.4.4",
 47 |     "webextension-polyfill": "0.10.0",
 48 |     "zod": "^3.23.8",
 49 |     "zod-validation-error": "^3.3.1",
 50 |     "zustand": "^4.5.2"
 51 |   },
 52 |   "devDependencies": {
 53 |     "@commitlint/cli": "19.5.0",
 54 |     "@commitlint/config-conventional": "18.1.0",
 55 |     "@jest/globals": "^29.7.0",
 56 |     "@rollup/plugin-typescript": "11.1.6",
 57 |     "@testing-library/react": "14.0.0",
 58 |     "@types/chrome": "0.0.251",
 59 |     "@types/dom-speech-recognition": "^0.0.4",
 60 |     "@types/jest": "29.5.7",
 61 |     "@types/lodash": "^4.17.7",
 62 |     "@types/node": "20.11.24",
 63 |     "@types/react": "18.2.37",
 64 |     "@types/react-dom": "18.2.22",
 65 |     "@types/ws": "8.5.10",
 66 |     "@typescript-eslint/eslint-plugin": "6.10.0",
 67 |     "@typescript-eslint/parser": "6.9.1",
 68 |     "@vitejs/plugin-react": "4.2.1",
 69 |     "autoprefixer": "^10.4.16",
 70 |     "chokidar": "3.6.0",
 71 |     "cross-env": "7.0.3",
 72 |     "eslint": "8.57.0",
 73 |     "eslint-config-airbnb-typescript": "17.1.0",
 74 |     "eslint-config-prettier": "9.1.0",
 75 |     "eslint-plugin-import": "2.29.1",
 76 |     "eslint-plugin-jsx-a11y": "6.8.0",
 77 |     "eslint-plugin-prettier": "5.1.3",
 78 |     "eslint-plugin-react": "7.35.0",
 79 |     "eslint-plugin-react-hooks": "4.6.0",
 80 |     "fs-extra": "11.1.1",
 81 |     "husky": "9.0.11",
 82 |     "jest": "29.7.0",
 83 |     "jest-environment-jsdom": "29.7.0",
 84 |     "lint-staged": "15.2.7",
 85 |     "npm-run-all": "4.1.5",
 86 |     "postcss": "^8.4.38",
 87 |     "prettier": "3.2.5",
 88 |     "rollup": "4.17.2",
 89 |     "rollup-plugin-dts": "^6.1.1",
 90 |     "rollup-plugin-esbuild": "^6.1.1",
 91 |     "sass": "1.72.0",
 92 |     "ts-jest": "29.2.5",
 93 |     "tslib": "2.6.2",
 94 |     "typescript": "5.5.3",
 95 |     "vite": "5.2.14",
 96 |     "ws": "8.18.0"
 97 |   },
 98 |   "lint-staged": {
 99 |     "*.{js,jsx,ts,tsx}": [
100 |       "prettier --write",
101 |       "eslint --fix"
102 |     ]
103 |   },
104 |   "packageManager": "pnpm@9.13.2"
105 | }
106 | 


--------------------------------------------------------------------------------
/package.lib.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "name": "web-wand-lib",
 3 |   "version": "2.0.3",
 4 |   "description": "Helper library for Web Wand",
 5 |   "repository": {
 6 |     "type": "git",
 7 |     "url": "https://github.com/normal-computing/web-wand"
 8 |   }
 9 | }
10 | 


--------------------------------------------------------------------------------
/postcss.config.js:
--------------------------------------------------------------------------------
// PostCSS configuration: enables the tailwindcss and autoprefixer plugins,
// each with an empty options object.
export default {
  plugins: {
    tailwindcss: {},
    autoprefixer: {},
  },
};
7 | 


--------------------------------------------------------------------------------
/public/icon-128.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/normal-computing/fuji-web/1aec509e4c437ca7764a5b4a56deaeba18691729/public/icon-128.png


--------------------------------------------------------------------------------
/rollup.lib.config.js:
--------------------------------------------------------------------------------
 1 | import dts from "rollup-plugin-dts";
 2 | import esbuild from "rollup-plugin-esbuild";
 3 | import { resolve, dirname } from "path";
 4 | import { fileURLToPath } from "url";
 5 | 
// Derive this config file's directory from the module URL
// (the package is declared as an ES module, see "type": "module").
const __dirname = dirname(fileURLToPath(import.meta.url));

// Directory that receives every generated bundle and declaration file.
const OUT_DIR = "dist-lib";
// Absolute paths, all resolved from this config file's directory.
const rootDir = resolve(__dirname);
const srcDir = resolve(rootDir, "src");
const pagesDir = resolve(srcDir, "pages");
12 | 
/**
 * Build the two Rollup configurations for one library entry point:
 * a CommonJS bundle (with sourcemap) compiled through the esbuild plugin,
 * and a declaration file produced through the dts plugin.
 *
 * @param {string} name Base file name (without extension) of the outputs inside OUT_DIR.
 * @param {string} path Entry module handed to Rollup as `input`.
 * @returns {object[]} `[bundleConfig, declarationConfig]`, in that order.
 */
function createConfigPair(name, path) {
  // Both outputs share the same location and base name; only the extension differs.
  const outputBase = `${OUT_DIR}/${name}`;

  const bundleConfig = {
    input: path,
    plugins: [esbuild()],
    output: [
      {
        file: `${outputBase}.js`,
        format: "cjs",
        sourcemap: true,
        exports: "auto",
      },
    ],
  };

  const declarationConfig = {
    input: path,
    plugins: [dts()],
    output: {
      file: `${outputBase}.d.ts`,
      format: "es",
    },
  };

  return [bundleConfig, declarationConfig];
}
37 | 
// Rollup receives one flat array: a bundle + declaration config pair for each
// library entry point (content-script DOM operations, and the helpers index).
export default [
  ...createConfigPair(
    "domOperations",
    resolve(pagesDir, "content", "domOperations.ts"),
  ),
  ...createConfigPair("helpers", resolve(srcDir, "helpers", "index.ts")),
];
45 | 


--------------------------------------------------------------------------------
/src/assets/img/logo.svg:
--------------------------------------------------------------------------------
1 | <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 841.9 595.3">
2 |     <g fill="#61DAFB">
3 |         <path d="M666.3 296.5c0-32.5-40.7-63.3-103.1-82.4 14.4-63.6 8-114.2-20.2-130.4-6.5-3.8-14.1-5.6-22.4-5.6v22.3c4.6 0 8.3.9 11.4 2.6 13.6 7.8 19.5 37.5 14.9 75.7-1.1 9.4-2.9 19.3-5.1 29.4-19.6-4.8-41-8.5-63.5-10.9-13.5-18.5-27.5-35.3-41.6-50 32.6-30.3 63.2-46.9 84-46.9V78c-27.5 0-63.5 19.6-99.9 53.6-36.4-33.8-72.4-53.2-99.9-53.2v22.3c20.7 0 51.4 16.5 84 46.6-14 14.7-28 31.4-41.3 49.9-22.6 2.4-44 6.1-63.6 11-2.3-10-4-19.7-5.2-29-4.7-38.2 1.1-67.9 14.6-75.8 3-1.8 6.9-2.6 11.5-2.6V78.5c-8.4 0-16 1.8-22.6 5.6-28.1 16.2-34.4 66.7-19.9 130.1-62.2 19.2-102.7 49.9-102.7 82.3 0 32.5 40.7 63.3 103.1 82.4-14.4 63.6-8 114.2 20.2 130.4 6.5 3.8 14.1 5.6 22.5 5.6 27.5 0 63.5-19.6 99.9-53.6 36.4 33.8 72.4 53.2 99.9 53.2 8.4 0 16-1.8 22.6-5.6 28.1-16.2 34.4-66.7 19.9-130.1 62-19.1 102.5-49.9 102.5-82.3zm-130.2-66.7c-3.7 12.9-8.3 26.2-13.5 39.5-4.1-8-8.4-16-13.1-24-4.6-8-9.5-15.8-14.4-23.4 14.2 2.1 27.9 4.7 41 7.9zm-45.8 106.5c-7.8 13.5-15.8 26.3-24.1 38.2-14.9 1.3-30 2-45.2 2-15.1 0-30.2-.7-45-1.9-8.3-11.9-16.4-24.6-24.2-38-7.6-13.1-14.5-26.4-20.8-39.8 6.2-13.4 13.2-26.8 20.7-39.9 7.8-13.5 15.8-26.3 24.1-38.2 14.9-1.3 30-2 45.2-2 15.1 0 30.2.7 45 1.9 8.3 11.9 16.4 24.6 24.2 38 7.6 13.1 14.5 26.4 20.8 39.8-6.3 13.4-13.2 26.8-20.7 39.9zm32.3-13c5.4 13.4 10 26.8 13.8 39.8-13.1 3.2-26.9 5.9-41.2 8 4.9-7.7 9.8-15.6 14.4-23.7 4.6-8 8.9-16.1 13-24.1zM421.2 430c-9.3-9.6-18.6-20.3-27.8-32 9 .4 18.2.7 27.5.7 9.4 0 18.7-.2 27.8-.7-9 11.7-18.3 22.4-27.5 32zm-74.4-58.9c-14.2-2.1-27.9-4.7-41-7.9 3.7-12.9 8.3-26.2 13.5-39.5 4.1 8 8.4 16 13.1 24 4.7 8 9.5 15.8 14.4 23.4zM420.7 163c9.3 9.6 18.6 20.3 27.8 32-9-.4-18.2-.7-27.5-.7-9.4 0-18.7.2-27.8.7 9-11.7 18.3-22.4 27.5-32zm-74 58.9c-4.9 7.7-9.8 15.6-14.4 23.7-4.6 8-8.9 16-13 24-5.4-13.4-10-26.8-13.8-39.8 13.1-3.1 26.9-5.8 41.2-7.9zm-90.5 125.2c-35.4-15.1-58.3-34.9-58.3-50.6 0-15.7 22.9-35.6 58.3-50.6 8.6-3.7 18-7 27.7-10.1 5.7 19.6 13.2 40 22.5 60.9-9.2 20.8-16.6 41.1-22.2 60.6-9.9-3.1-19.3-6.5-28-10.2zM310 
490c-13.6-7.8-19.5-37.5-14.9-75.7 1.1-9.4 2.9-19.3 5.1-29.4 19.6 4.8 41 8.5 63.5 10.9 13.5 18.5 27.5 35.3 41.6 50-32.6 30.3-63.2 46.9-84 46.9-4.5-.1-8.3-1-11.3-2.7zm237.2-76.2c4.7 38.2-1.1 67.9-14.6 75.8-3 1.8-6.9 2.6-11.5 2.6-20.7 0-51.4-16.5-84-46.6 14-14.7 28-31.4 41.3-49.9 22.6-2.4 44-6.1 63.6-11 2.3 10.1 4.1 19.8 5.2 29.1zm38.5-66.7c-8.6 3.7-18 7-27.7 10.1-5.7-19.6-13.2-40-22.5-60.9 9.2-20.8 16.6-41.1 22.2-60.6 9.9 3.1 19.3 6.5 28.1 10.2 35.4 15.1 58.3 34.9 58.3 50.6-.1 15.7-23 35.6-58.4 50.6zM320.8 78.4z"/>
4 |         <circle cx="420.9" cy="296.5" r="45.7"/>
5 |         <path d="M520.5 78.1z"/>
6 |     </g>
7 | </svg>
8 | 


--------------------------------------------------------------------------------
/src/assets/style/theme.scss:
--------------------------------------------------------------------------------
1 | .crx-class {
2 |   color: pink;
3 | }
4 | 


--------------------------------------------------------------------------------
/src/common/App.tsx:
--------------------------------------------------------------------------------
 1 | import {
 2 |   Link,
 3 |   Box,
 4 |   ChakraProvider,
 5 |   Heading,
 6 |   HStack,
 7 |   IconButton,
 8 |   Icon,
 9 | } from "@chakra-ui/react";
10 | import { SettingsIcon } from "@chakra-ui/icons";
11 | import { FaDiscord, FaGithub } from "react-icons/fa6";
12 | import { useState } from "react";
13 | import { useAppState } from "../state/store";
14 | import SetAPIKey from "./settings/SetAPIKey";
15 | import TaskUI from "./TaskUI";
16 | import Settings from "./Settings";
17 | 
/**
 * Root component of the UI.
 *
 * Until an Anthropic or OpenAI key is present in settings, only the API-key
 * form is shown. Once a key exists, the header gains a settings button and
 * the body switches between the task UI and the settings view. A fixed footer
 * with project links is always rendered.
 */
const App = () => {
  const hasAPIKey = useAppState(
    (state) => state.settings.anthropicKey || state.settings.openAIKey,
  );
  const [inSettingsView, setInSettingsView] = useState(false);

  const openSettings = () => setInSettingsView(true);

  // Decide which view fills the body of the panel.
  const renderMainView = () => {
    if (!hasAPIKey) {
      return <SetAPIKey asInitializerView />;
    }
    if (inSettingsView) {
      return <Settings setInSettingsView={setInSettingsView} />;
    }
    return <TaskUI />;
  };

  return (
    <ChakraProvider>
      <Box p="8" pb="24" fontSize="lg" w="full">
        <HStack mb={4} alignItems="center">
          <Heading as="h1" size="lg" flex={1}>
            Fuji 🗻
          </Heading>
          {hasAPIKey && (
            <IconButton
              aria-label="open settings"
              icon={<SettingsIcon />}
              onClick={openSettings}
            />
          )}
        </HStack>
        {renderMainView()}
      </Box>
      <Box
        as="footer"
        pos="fixed"
        bottom={0}
        zIndex={2}
        w="100%"
        px="8"
        backdropFilter="auto"
        backdropBlur="6px"
        backgroundColor="rgba(255, 255, 255, 0.6)"
      >
        <HStack
          justify="center"
          wrap="wrap"
          shouldWrapChildren
          columnGap="1.5rem"
          rowGap="0.5rem"
          py="3"
          fontSize="md"
          borderTop="1px dashed gray"
        >
          <Link
            href="https://github.com/normal-computing/fuji-web#readme"
            isExternal
          >
            About this project
          </Link>
          <Link href="https://forms.gle/isLeGyUvoKGiqT8W8" isExternal>
            Leave Feedback
          </Link>
          <Link href="https://github.com/normal-computing/fuji-web" isExternal>
            GitHub <Icon verticalAlign="text-bottom" as={FaGithub} />
          </Link>
          <Link href="https://discord.gg/yfMjZ8udb5" isExternal>
            Join Our Discord <Icon verticalAlign="text-bottom" as={FaDiscord} />
          </Link>
        </HStack>
      </Box>
    </ChakraProvider>
  );
};
90 | 
91 | export default App;
92 | 


--------------------------------------------------------------------------------
/src/common/AutosizeTextarea.tsx:
--------------------------------------------------------------------------------
 1 | import { Textarea, TextareaProps } from "@chakra-ui/react";
 2 | import ResizeTextarea from "react-textarea-autosize";
 3 | import React from "react";
 4 | 
 5 | const AutosizeTextarea = React.forwardRef<HTMLTextAreaElement, TextareaProps>(
 6 |   (props, ref) => {
 7 |     return (
 8 |       <Textarea
 9 |         minH="unset"
10 |         overflow="hidden"
11 |         w="100%"
12 |         resize="none"
13 |         ref={ref}
14 |         minRows={4}
15 |         as={ResizeTextarea}
16 |         {...props}
17 |       />
18 |     );
19 |   },
20 | );
21 | 
22 | AutosizeTextarea.displayName = "AutosizeTextarea";
23 | 
24 | export default AutosizeTextarea;
25 | 


--------------------------------------------------------------------------------
/src/common/CopyButton.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import { CopyIcon } from "@chakra-ui/icons";
 3 | import { useToast } from "@chakra-ui/react";
 4 | import { callRPC } from "../helpers/rpc/pageRPC";
 5 | 
 6 | export default function CopyButton(props: { text: string }) {
 7 |   const toast = useToast();
 8 | 
 9 |   return (
10 |     <CopyIcon
11 |       cursor="pointer"
12 |       color="gray.500"
13 |       _hover={{ color: "gray.700" }}
14 |       onClick={async (event) => {
15 |         try {
16 |           event.preventDefault();
17 |           await callRPC("copyToClipboard", [props.text]);
18 |           toast({
19 |             title: "Copied to clipboard",
20 |             status: "success",
21 |             duration: 3000,
22 |             isClosable: true,
23 |           });
24 |         } catch (e) {
25 |           console.error(e);
26 |           toast({
27 |             title: "Error",
28 |             description: "Could not copy to clipboard",
29 |             status: "error",
30 |             duration: 5000,
31 |             isClosable: true,
32 |           });
33 |         }
34 |       }}
35 |     />
36 |   );
37 | }
38 | 


--------------------------------------------------------------------------------
/src/common/CustomKnowledgeBase/DefaultKnowledge.tsx:
--------------------------------------------------------------------------------
 1 | import {
 2 |   Box,
 3 |   Button,
 4 |   Modal,
 5 |   ModalBody,
 6 |   ModalCloseButton,
 7 |   ModalContent,
 8 |   ModalFooter,
 9 |   ModalHeader,
10 |   ModalOverlay,
11 |   useDisclosure,
12 | } from "@chakra-ui/react";
13 | import { fetchAllDefaultKnowledge } from "@root/src/helpers/knowledge";
14 | import HostKnowledge from "./HostKnowledge";
15 | 
/**
 * Link-style button that opens a modal listing the built-in knowledge,
 * one bordered card per host. Hosts whose rules carry no notes are left out.
 */
const DefaultKnowledge = () => {
  const modal = useDisclosure();
  const knowledgeByHost = fetchAllDefaultKnowledge();

  // A host is listed only when at least one of its rules has a non-empty notes list.
  const hostHasNotes = (host: string) =>
    knowledgeByHost[host]?.rules?.some(
      (rule) => (rule.knowledge?.notes?.length ?? 0) > 0,
    );
  const hostsWithNotes = Object.keys(knowledgeByHost).filter(hostHasNotes);

  return (
    <>
      <Button
        variant="link"
        size="sm"
        colorScheme="blue"
        onClick={modal.onOpen}
      >
        View Built-in Instructions
      </Button>
      <Modal
        size="xl"
        scrollBehavior="inside"
        isOpen={modal.isOpen}
        onClose={modal.onClose}
      >
        <ModalOverlay />
        <ModalContent>
          <ModalHeader>Default Instructions</ModalHeader>
          <ModalCloseButton />
          <ModalBody>
            {hostsWithNotes.map((hostName) => (
              <Box
                key={hostName}
                w="full"
                p={4}
                mb={3}
                borderWidth="1px"
                borderRadius="lg"
              >
                <HostKnowledge host={hostName} isDefaultKnowledge={true} />
              </Box>
            ))}
          </ModalBody>
          <ModalFooter>
            <Button onClick={modal.onClose}>Close</Button>
          </ModalFooter>
        </ModalContent>
      </Modal>
    </>
  );
};
62 | 
63 | export default DefaultKnowledge;
64 | 


--------------------------------------------------------------------------------
/src/common/CustomKnowledgeBase/DuplicateKnowledgeAlert.tsx:
--------------------------------------------------------------------------------
 1 | import React, { useRef } from "react";
 2 | import {
 3 |   AlertDialog,
 4 |   AlertDialogBody,
 5 |   AlertDialogFooter,
 6 |   AlertDialogHeader,
 7 |   AlertDialogContent,
 8 |   AlertDialogOverlay,
 9 |   Button,
10 | } from "@chakra-ui/react";
11 | 
12 | type DuplicateKnowledgeAlertProps = {
13 |   host: string;
14 |   isOpen: boolean;
15 |   onSave: () => void;
16 |   onClose: () => void;
17 | };
18 | 
/**
 * Confirmation dialog shown before overwriting knowledge that already exists
 * for `host`. "Save" calls `onSave`; "Cancel" and dismissing the dialog call
 * `onClose`. The Cancel button is registered as the least destructive action.
 */
const DuplicateKnowledgeAlert = (props: DuplicateKnowledgeAlertProps) => {
  const { host, isOpen, onSave, onClose } = props;
  const cancelButtonRef = useRef<HTMLButtonElement>(null);

  return (
    <AlertDialog
      isCentered
      isOpen={isOpen}
      leastDestructiveRef={cancelButtonRef}
      onClose={onClose}
    >
      <AlertDialogOverlay>
        <AlertDialogContent>
          <AlertDialogHeader fontSize="lg" fontWeight="bold">
            Save Knowledge
          </AlertDialogHeader>

          <AlertDialogBody fontSize="md">
            {host} already exists in the knowledge base. Saving will overwrite
            it. Do you want to proceed?
          </AlertDialogBody>

          <AlertDialogFooter>
            <Button size="sm" mr={3} colorScheme="blue" onClick={onSave}>
              Save
            </Button>
            <Button size="sm" onClick={onClose} ref={cancelButtonRef}>
              Cancel
            </Button>
          </AlertDialogFooter>
        </AlertDialogContent>
      </AlertDialogOverlay>
    </AlertDialog>
  );
};
58 | 
59 | export default DuplicateKnowledgeAlert;
60 | 


--------------------------------------------------------------------------------
/src/common/CustomKnowledgeBase/HostKnowledge.tsx:
--------------------------------------------------------------------------------
  1 | import { DeleteIcon, EditIcon } from "@chakra-ui/icons";
  2 | import {
  3 |   Heading,
  4 |   Accordion,
  5 |   AccordionItem,
  6 |   AccordionButton,
  7 |   AccordionPanel,
  8 |   AccordionIcon,
  9 |   IconButton,
 10 |   Tooltip,
 11 |   Flex,
 12 |   Box,
 13 | } from "@chakra-ui/react";
 14 | import { fetchAllDefaultKnowledge } from "../../helpers/knowledge";
 15 | import { useAppState } from "@root/src/state/store";
 16 | import Notes from "./Notes";
 17 | 
 18 | type HostKnowledgeProps = {
 19 |   host: string;
 20 |   isDefaultKnowledge: boolean;
 21 |   onEdit?: (host: string) => void;
 22 | };
 23 | 
 24 | const HostKnowledge = ({
 25 |   host,
 26 |   isDefaultKnowledge,
 27 |   onEdit,
 28 | }: HostKnowledgeProps) => {
 29 |   const updateSettings = useAppState((state) => state.settings.actions.update);
 30 |   const customKnowledgeBase = useAppState(
 31 |     (state) => state.settings.customKnowledgeBase,
 32 |   );
 33 |   const knowledgeBase = isDefaultKnowledge
 34 |     ? fetchAllDefaultKnowledge()
 35 |     : customKnowledgeBase;
 36 | 
 37 |   if (knowledgeBase[host] === undefined) {
 38 |     return null;
 39 |   }
 40 |   const rules = knowledgeBase[host].rules;
 41 |   if (rules === undefined) {
 42 |     return null;
 43 |   }
 44 | 
 45 |   const handleRemove = () => {
 46 |     const newKnowledge = { ...knowledgeBase };
 47 |     delete newKnowledge[host];
 48 |     updateSettings({ customKnowledgeBase: newKnowledge });
 49 |   };
 50 | 
 51 |   // temporarily disable copy feature
 52 |   /*
 53 |   const getJsonString = (): string => {
 54 |     return JSON.stringify(knowledgeBase[host], null, 2);
 55 |   };
 56 | 
 57 |   const handleCopy = async () => {
 58 |     try {
 59 |       await navigator.clipboard.writeText(getJsonString());
 60 |       toast({
 61 |         title: "Copied",
 62 |         description: "Knowledge has been copied to clipboard.",
 63 |         status: "success",
 64 |         duration: 2000,
 65 |         isClosable: true,
 66 |       });
 67 |     } catch (err) {
 68 |       toast({
 69 |         title: "Error",
 70 |         description: "Failed to copy knowledge to clipboard.",
 71 |         status: "error",
 72 |         duration: 2000,
 73 |         isClosable: true,
 74 |       });
 75 |     }
 76 |   };
 77 |   */
 78 | 
 79 |   return (
 80 |     <>
 81 |       <Flex alignItems="flex-start" mb="2">
 82 |         <Heading
 83 |           as="h5"
 84 |           size="sm"
 85 |           flex="1"
 86 |           overflowWrap="anywhere"
 87 |           lineHeight="1.5rem"
 88 |         >
 89 |           {!isDefaultKnowledge && (
 90 |             <Box
 91 |               position="relative"
 92 |               style={{ float: "right", marginTop: "-4px" }}
 93 |             >
 94 |               <Tooltip label="Edit knowledge">
 95 |                 <IconButton
 96 |                   aria-label="Edit knowledge"
 97 |                   icon={<EditIcon />}
 98 |                   size="sm"
 99 |                   variant="ghost"
100 |                   onClick={() => {
101 |                     if (onEdit) onEdit(host);
102 |                   }}
103 |                 />
104 |               </Tooltip>
105 |               <Tooltip label="Remove knowledge">
106 |                 <IconButton
107 |                   aria-label="Remove knowledge"
108 |                   icon={<DeleteIcon />}
109 |                   size="sm"
110 |                   variant="ghost"
111 |                   onClick={handleRemove}
112 |                 />
113 |               </Tooltip>
114 |             </Box>
115 |           )}
116 |           {host}
117 |         </Heading>
118 |       </Flex>
119 |       <Accordion allowToggle>
120 |         {rules.map((rule, ruleIndex) => {
121 |           // Skip rules without notes
122 |           if (
123 |             rule.knowledge === undefined ||
124 |             rule.knowledge.notes === undefined ||
125 |             rule.knowledge.notes.length === 0
126 |           ) {
127 |             return null;
128 |           }
129 |           return (
130 |             <AccordionItem key={ruleIndex} backgroundColor="white">
131 |               <h2>
132 |                 <AccordionButton>
133 |                   <Box flex="1" textAlign="left">
134 |                     Instructions Set {ruleIndex + 1}
135 |                   </Box>
136 |                   <AccordionIcon />
137 |                 </AccordionButton>
138 |               </h2>
139 |               <AccordionPanel pb={4}>
140 |                 <Notes notes={rule.knowledge.notes} />
141 |               </AccordionPanel>
142 |             </AccordionItem>
143 |           );
144 |         })}
145 |       </Accordion>
146 |     </>
147 |   );
148 | };
149 | 
150 | export default HostKnowledge;
151 | 


--------------------------------------------------------------------------------
/src/common/CustomKnowledgeBase/NewKnowledgeJson.tsx:
--------------------------------------------------------------------------------
  1 | import {
  2 |   Button,
  3 |   Modal,
  4 |   ModalBody,
  5 |   ModalCloseButton,
  6 |   ModalContent,
  7 |   ModalFooter,
  8 |   ModalHeader,
  9 |   ModalOverlay,
 10 |   Textarea,
 11 |   useToast,
 12 | } from "@chakra-ui/react";
 13 | import { useAppState } from "@root/src/state/store";
 14 | import { useState } from "react";
 15 | import DuplicateKnowledgeAlert from "./DuplicateKnowledgeAlert";
 16 | import { type Data } from "@root/src/helpers/knowledge";
 17 | 
 18 | type NewKnowledgeJsonProps = {
 19 |   isOpen: boolean;
 20 |   onClose: () => void;
 21 | };
 22 | 
 23 | const NewKnowledgeJson = ({ isOpen, onClose }: NewKnowledgeJsonProps) => {
 24 |   const [jsonInput, setJsonInput] = useState("");
 25 |   const [showDuplicateAlert, setShowDuplicateAlert] = useState(false);
 26 |   const [newCustomKnowledge, setNewCustomKnowledge] = useState<Data | null>(
 27 |     null,
 28 |   );
 29 |   const [duplicatedHosts, setduplicatedHosts] = useState<Data | null>(null);
 30 |   const toast = useToast();
 31 |   const updateSettings = useAppState((state) => state.settings.actions.update);
 32 |   const customKnowledgeBase = useAppState(
 33 |     (state) => state.settings.customKnowledgeBase,
 34 |   );
 35 | 
 36 |   function saveKnowledges() {
 37 |     const newKnowledge = { ...customKnowledgeBase, ...newCustomKnowledge };
 38 |     updateSettings({ customKnowledgeBase: newKnowledge });
 39 |   }
 40 | 
 41 |   const validateJSON = () => {
 42 |     try {
 43 |       const parsedJson = JSON.parse(jsonInput);
 44 |       const dupHosts: Data = {};
 45 |       const hostsKnowledges: Data = {};
 46 |       Object.keys(parsedJson).forEach((host: string) => {
 47 |         const hostKnowledge = parsedJson[host];
 48 |         // Basic validation for the structure
 49 |         if (!hostKnowledge.rules || !Array.isArray(hostKnowledge.rules)) {
 50 |           throw new Error(`Invalid structure for host: ${host}`);
 51 |         }
 52 |         // Further validation can be added here, e.g., checking if regex is valid, checking each rule's structure
 53 | 
 54 |         const hostName = host.startsWith("www.") ? host.slice(4) : host;
 55 |         hostsKnowledges[hostName] = hostKnowledge;
 56 |         if (hostName in customKnowledgeBase) {
 57 |           dupHosts[hostName] = hostKnowledge;
 58 |         }
 59 |       });
 60 |       setNewCustomKnowledge(hostsKnowledges);
 61 |       if (Object.keys(dupHosts).length > 0) {
 62 |         setduplicatedHosts(dupHosts);
 63 |         setShowDuplicateAlert(true);
 64 |       } else {
 65 |         saveKnowledges();
 66 |         setJsonInput("");
 67 |         onClose();
 68 |       }
 69 |     } catch (error) {
 70 |       console.error("Failed to save JSON", error);
 71 |       toast({
 72 |         title: "Error",
 73 |         description: `"Failed to save JSON: ${error}`,
 74 |         status: "error",
 75 |         duration: 5000,
 76 |         isClosable: true,
 77 |       });
 78 |     }
 79 |   };
 80 | 
 81 |   const duplicatedHostsNames = (): string => {
 82 |     let names = "";
 83 |     if (duplicatedHosts) {
 84 |       Object.keys(duplicatedHosts).forEach((host) => {
 85 |         names = names + host;
 86 |       });
 87 |     }
 88 |     return names;
 89 |   };
 90 | 
 91 |   function handleAlertOnSave(): void {
 92 |     saveKnowledges();
 93 |     setduplicatedHosts(null);
 94 |     setShowDuplicateAlert(false);
 95 |     setJsonInput("");
 96 |     onClose();
 97 |   }
 98 | 
 99 |   return (
100 |     <Modal isOpen={isOpen} onClose={onClose}>
101 |       <ModalOverlay />
102 |       <ModalContent>
103 |         <ModalCloseButton />
104 |         <DuplicateKnowledgeAlert
105 |           host={duplicatedHostsNames()}
106 |           isOpen={showDuplicateAlert}
107 |           onSave={handleAlertOnSave}
108 |           onClose={() => setShowDuplicateAlert(false)}
109 |         />
110 |         <ModalHeader>New Host Knowledge</ModalHeader>
111 |         <ModalBody>
112 |           <Textarea
113 |             value={jsonInput}
114 |             onChange={(e) => setJsonInput(e.target.value)}
115 |             placeholder="Enter knowledge in JSON format"
116 |             height="auto"
117 |             rows={20}
118 |           />
119 |         </ModalBody>
120 |         <ModalFooter>
121 |           <Button colorScheme="blue" mr={3} onClick={validateJSON}>
122 |             Save
123 |           </Button>
124 |           <Button onClick={onClose}>Cancel</Button>
125 |         </ModalFooter>
126 |       </ModalContent>
127 |     </Modal>
128 |   );
129 | };
130 | 
131 | export default NewKnowledgeJson;
132 | 


--------------------------------------------------------------------------------
/src/common/CustomKnowledgeBase/Notes.tsx:
--------------------------------------------------------------------------------
 1 | import { UnorderedList, ListItem } from "@chakra-ui/react";
 2 | 
 3 | export default function Notes({ notes }: { notes: string[] | undefined }) {
 4 |   if (!notes || notes.length === 0) {
 5 |     return null;
 6 |   }
 7 |   return (
 8 |     <UnorderedList fontSize="0.8rem" styleType="circle">
 9 |       {notes.map((note, index) => (
10 |         <ListItem key={index}>{note}</ListItem>
11 |       ))}
12 |     </UnorderedList>
13 |   );
14 | }
15 | 


--------------------------------------------------------------------------------
/src/common/CustomKnowledgeBase/index.tsx:
--------------------------------------------------------------------------------
 1 | import React, { useState } from "react";
 2 | import { Button, Text, VStack, Box } from "@chakra-ui/react";
 3 | import { useAppState } from "@root/src/state/store";
 4 | import NewKnowledgeForm from "./NewKnowledgeForm";
 5 | import { type EditingData } from "../../helpers/knowledge";
 6 | import DefaultKnowledge from "./DefaultKnowledge";
 7 | import HostKnowledge from "./HostKnowledge";
 8 | // import NewKnowledgeJson from "./NewKnowledgeJson";
 9 | import { findActiveTab } from "../../helpers/browserUtils";
10 | 
/**
 * Settings panel listing the default knowledge plus every custom host entry,
 * with a form for adding new instructions or editing an existing host.
 */
const CustomKnowledgeBase = () => {
  const [isFormOpen, setIsFormOpen] = useState(false);
  const [editKnowledge, setEditKnowledge] = useState<EditingData | undefined>(
    undefined,
  );
  const customKnowledgeBase = useAppState(
    (state) => state.settings.customKnowledgeBase,
  );
  // const {
  //   isOpen: isJsonInputOpen,
  //   onOpen: openJsonInput,
  //   onClose: closeJsonInput,
  // } = useDisclosure();
  const [defaultHost, setDefaultHost] = useState("");
  const [currentURL, setCurrentUrl] = useState("");

  // Opens the form, pre-filling host and URL from the active tab when it has one.
  const openForm = async () => {
    const activeTab = await findActiveTab();
    const activeUrl = activeTab?.url;
    if (activeUrl) {
      setCurrentUrl(activeUrl);
      // URLs starting with "chrome" get no default host; otherwise use the
      // hostname with a leading "www." removed.
      const hostForForm = activeUrl.startsWith("chrome")
        ? ""
        : new URL(activeUrl).hostname.replace(/^www\./, "");
      setDefaultHost(hostForForm);
    }
    setIsFormOpen(true);
  };

  // Closes the form and leaves edit mode.
  const closeForm = () => {
    setEditKnowledge(undefined);
    setIsFormOpen(false);
  };

  // Opens the form in edit mode for `host`, tagging each stored rule as a custom regex.
  const openEditForm = (host: string) => {
    const storedRules = customKnowledgeBase[host].rules;
    if (storedRules) {
      setEditKnowledge({
        host,
        rules: storedRules.map((rule) => ({ ...rule, regexType: "custom" })),
      });
    }

    openForm();
  };

  const hosts = Object.keys(customKnowledgeBase);
  const hostSections =
    hosts.length > 0 ? (
      hosts.map((host) => (
        <Box key={host} w="full" p={4} borderWidth="1px" borderRadius="lg">
          <HostKnowledge
            host={host}
            isDefaultKnowledge={false}
            onEdit={openEditForm}
          />
        </Box>
      ))
    ) : (
      <Text>No instructions found</Text>
    );

  return (
    <VStack spacing={4}>
      <DefaultKnowledge />
      {hostSections}
      <Button onClick={openForm}>Add Instructions</Button>
      {/* <Button onClick={openJsonInput}>Add Host Knowledge with JSON</Button> */}
      <NewKnowledgeForm
        isOpen={isFormOpen}
        isEditMode={!!editKnowledge}
        editKnowledge={editKnowledge}
        closeForm={closeForm}
        defaultHost={defaultHost}
        currentURL={currentURL}
      />
      {/* <NewKnowledgeJson isOpen={isJsonInputOpen} onClose={closeJsonInput} /> */}
    </VStack>
  );
};
95 | 
96 | export default CustomKnowledgeBase;
97 | 


--------------------------------------------------------------------------------
/src/common/RecommendedTasks.tsx:
--------------------------------------------------------------------------------
 1 | import { Button, VStack, Text } from "@chakra-ui/react";
 2 | import { useAppState } from "../state/store";
 3 | 
 4 | const tasks = [
 5 |   'Post on twitter.com with content "An automated post from Fuji-Web by @NormalComputing! :)" If I\'m not logged in, fail the task and wait for me to log in.',
 6 |   "Find a book about AI and add a physical copy to cart on Amazon.com. Pick the cheaper one from paperback and hardcover.",
 7 | ];
 8 | 
 9 | const RecommendedTasks = ({
10 |   runTask,
11 | }: {
12 |   runTask: (instructions: string) => void;
13 | }) => {
14 |   const state = useAppState((state) => ({
15 |     instructions: state.ui.instructions,
16 |   }));
17 |   if (state.instructions) {
18 |     return null;
19 |   }
20 | 
21 |   const onButtonClick = (idx: number) => {
22 |     runTask(tasks[idx]);
23 |   };
24 | 
25 |   return (
26 |     <VStack spacing={2} align="stretch">
27 |       <Text fontSize="large" mt={1}>
28 |         Examples:
29 |       </Text>
30 |       <Button
31 |         textAlign="left"
32 |         display="block"
33 |         variant="outline"
34 |         height="4rem"
35 |         onClick={() => onButtonClick(0)}
36 |       >
37 |         <Text fontWeight={600} noOfLines={1}>
38 |           Post on twitter.com
39 |         </Text>
40 |         <Text fontWeight={400} noOfLines={1} color="gray">
41 |           with content &quot;An automated post from Fuji-Web by
42 |           @NormalComputing!&quot;
43 |         </Text>
44 |       </Button>
45 |       <Button
46 |         textAlign="left"
47 |         display="block"
48 |         variant="outline"
49 |         height="4rem"
50 |         onClick={() => onButtonClick(1)}
51 |       >
52 |         <Text fontWeight={600} noOfLines={1}>
53 |           Find a book about AI
54 |         </Text>
55 |         <Text fontWeight={400} noOfLines={1} color="gray">
56 |           and add a physical copy to cart on Amazon.com
57 |         </Text>
58 |       </Button>
59 |     </VStack>
60 |   );
61 | };
62 | 
63 | export default RecommendedTasks;
64 | 


--------------------------------------------------------------------------------
/src/common/RunTaskButton.tsx:
--------------------------------------------------------------------------------
 1 | import { Button, HStack, Icon } from "@chakra-ui/react";
 2 | import React from "react";
 3 | import { useAppState } from "../state/store";
 4 | import { BsPlayFill, BsStopFill } from "react-icons/bs";
 5 | 
 6 | export default function RunTaskButton(props: { runTask: () => void }) {
 7 |   const state = useAppState((state) => ({
 8 |     taskState: state.currentTask.status,
 9 |     instructions: state.ui.instructions,
10 |     interruptTask: state.currentTask.actions.interrupt,
11 |   }));
12 | 
13 |   let button = (
14 |     <Button
15 |       rightIcon={<Icon as={BsPlayFill} boxSize={6} />}
16 |       onClick={props.runTask}
17 |       colorScheme="green"
18 |       disabled={state.taskState === "running" || !state.instructions}
19 |     >
20 |       Start Task
21 |     </Button>
22 |   );
23 | 
24 |   if (state.taskState === "running") {
25 |     button = (
26 |       <Button
27 |         rightIcon={<Icon as={BsStopFill} boxSize={6} />}
28 |         onClick={state.interruptTask}
29 |         colorScheme="red"
30 |       >
31 |         Stop
32 |       </Button>
33 |     );
34 |   }
35 | 
36 |   return <HStack alignItems="center">{button}</HStack>;
37 | }
38 | 


--------------------------------------------------------------------------------
/src/common/TaskHistory.tsx:
--------------------------------------------------------------------------------
  1 | import { useState } from "react";
  2 | import {
  3 |   Alert,
  4 |   AlertIcon,
  5 |   AlertDescription,
  6 |   VStack,
  7 |   HStack,
  8 |   Box,
  9 |   Accordion,
 10 |   AccordionItem,
 11 |   Heading,
 12 |   AccordionButton,
 13 |   AccordionPanel,
 14 |   AccordionIcon,
 15 |   Icon,
 16 |   Spacer,
 17 |   ColorProps,
 18 |   BackgroundProps,
 19 | } from "@chakra-ui/react";
 20 | import { TaskHistoryEntry } from "../state/currentTask";
 21 | import { BsSortNumericDown, BsSortNumericUp } from "react-icons/bs";
 22 | import { useAppState } from "../state/store";
 23 | import CopyButton from "./CopyButton";
 24 | import Notes from "./CustomKnowledgeBase/Notes";
 25 | 
 26 | function MatchedNotes() {
 27 |   const knowledge = useAppState((state) => state.currentTask.knowledgeInUse);
 28 |   const notes = knowledge?.notes;
 29 |   if (!notes || notes.length === 0) {
 30 |     return null;
 31 |   }
 32 | 
 33 |   return (
 34 |     <AccordionItem>
 35 |       <Heading as="h3" size="sm">
 36 |         <AccordionButton>
 37 |           <Box mr="4" fontWeight="bold">
 38 |             0.
 39 |           </Box>
 40 |           <Box as="span" textAlign="left" flex="1">
 41 |             Found {notes.length} instructions.
 42 |           </Box>
 43 |           <AccordionIcon />
 44 |         </AccordionButton>
 45 |       </Heading>
 46 |       <AccordionPanel backgroundColor="gray.100" p="2">
 47 |         <Accordion allowMultiple w="full" defaultIndex={1}>
 48 |           <Box pl={2}>
 49 |             <Notes notes={notes} />
 50 |           </Box>
 51 |           <Alert status="info" borderRadius="sm" mt="1">
 52 |             <AlertIcon />
 53 |             <AlertDescription fontSize="0.8rem" lineHeight="4">
 54 |               You can customize instructions in the settings menu.
 55 |             </AlertDescription>
 56 |           </Alert>
 57 |         </Accordion>
 58 |       </AccordionPanel>
 59 |     </AccordionItem>
 60 |   );
 61 | }
 62 | 
/** Props for a single row of the action history accordion. */
type TaskHistoryItemProps = {
  /** Zero-based position in the task history; displayed as `index + 1`. */
  index: number;
  /** History entry whose action, prompt, response and token usage are shown. */
  entry: TaskHistoryEntry;
};
 67 | 
 68 | const CollapsibleComponent = (props: {
 69 |   title: string;
 70 |   subtitle?: string;
 71 |   text: string;
 72 | }) => (
 73 |   <AccordionItem backgroundColor="white">
 74 |     <Heading as="h4" size="xs">
 75 |       <AccordionButton>
 76 |         <HStack flex="1">
 77 |           <Box>{props.title}</Box>
 78 |           <CopyButton text={props.text} /> <Spacer />
 79 |           {props.subtitle && (
 80 |             <Box as="span" fontSize="xs" color="gray.500" mr={4}>
 81 |               {props.subtitle}
 82 |             </Box>
 83 |           )}
 84 |         </HStack>
 85 |         <AccordionIcon />
 86 |       </AccordionButton>
 87 |     </Heading>
 88 |     <AccordionPanel>
 89 |       {props.text.split("\n").map((line, index) => (
 90 |         <Box key={index} fontSize="xs">
 91 |           {line}
 92 |           <br />
 93 |         </Box>
 94 |       ))}
 95 |     </AccordionPanel>
 96 |   </AccordionItem>
 97 | );
 98 | 
 99 | const TaskHistoryItem = ({ index, entry }: TaskHistoryItemProps) => {
100 |   const itemTitle = entry.action.thought;
101 | 
102 |   const colors: {
103 |     text: ColorProps["textColor"];
104 |     bg: BackgroundProps["bgColor"];
105 |   } = {
106 |     text: undefined,
107 |     bg: undefined,
108 |   };
109 |   if (entry.action.operation.name === "fail") {
110 |     colors.text = "red.800";
111 |     colors.bg = "red.100";
112 |   } else if (entry.action.operation.name === "finish") {
113 |     colors.text = "green.800";
114 |     colors.bg = "green.100";
115 |   }
116 | 
117 |   return (
118 |     <AccordionItem>
119 |       <Heading as="h3" size="sm" textColor={colors.text} bgColor={colors.bg}>
120 |         <AccordionButton>
121 |           <Box mr="4" fontWeight="bold">
122 |             {index + 1}.
123 |           </Box>
124 |           <Box as="span" textAlign="left" flex="1">
125 |             {itemTitle}
126 |           </Box>
127 |           <AccordionIcon />
128 |         </AccordionButton>
129 |       </Heading>
130 |       <AccordionPanel backgroundColor="gray.100" p="2">
131 |         <Accordion allowMultiple w="full" defaultIndex={1}>
132 |           {entry.usage != null && (
133 |             <>
134 |               <CollapsibleComponent
135 |                 title="Prompt"
136 |                 subtitle={`${entry.usage.prompt_tokens} tokens`}
137 |                 text={entry.prompt}
138 |               />
139 |               <CollapsibleComponent
140 |                 title="Response"
141 |                 subtitle={`${entry.usage.completion_tokens} tokens`}
142 |                 text={entry.response}
143 |               />
144 |               <CollapsibleComponent
145 |                 title="Action"
146 |                 text={JSON.stringify(entry.action, null, 2)}
147 |               />
148 |             </>
149 |           )}
150 |         </Accordion>
151 |       </AccordionPanel>
152 |     </AccordionItem>
153 |   );
154 | };
155 | 
/**
 * "Action History" section: the matched-notes entry followed by one row per
 * history entry, shown newest-first by default with a toggle to flip the
 * order, plus a button that copies the whole history as JSON.
 * Renders nothing when there is no history and no task is running.
 */
export default function TaskHistory() {
  const { taskHistory, taskStatus } = useAppState((state) => ({
    taskStatus: state.currentTask.status,
    taskHistory: state.currentTask.history,
  }));
  const [sortNumericDown, setSortNumericDown] = useState(false);

  const nothingToShow = taskHistory.length === 0 && taskStatus !== "running";
  if (nothingToShow) return null;

  // Ascending order: notes entry first, then the history rows by index.
  const ascendingItems = [
    <MatchedNotes key="matched-notes" />,
    ...taskHistory.map((entry, position) => (
      <TaskHistoryItem key={position} index={position} entry={entry} />
    )),
  ];
  const historyItems = sortNumericDown
    ? ascendingItems
    : ascendingItems.reverse();

  const sortIcon = sortNumericDown ? BsSortNumericDown : BsSortNumericUp;

  return (
    <VStack mt={8}>
      <HStack w="full">
        <Heading as="h3" size="md">
          Action History
        </Heading>
        <Spacer />
        <Icon
          as={sortIcon}
          cursor="pointer"
          color="gray.500"
          _hover={{ color: "gray.700" }}
          onClick={() => {
            setSortNumericDown(!sortNumericDown);
          }}
        />
        <CopyButton text={JSON.stringify(taskHistory, null, 2)} />
      </HStack>
      <Accordion allowMultiple w="full" pb="4">
        {historyItems}
      </Accordion>
    </VStack>
  );
}
197 | 


--------------------------------------------------------------------------------
/src/common/TaskStatus.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import { Box } from "@chakra-ui/react";
 3 | import { CurrentTaskSlice } from "../state/currentTask";
 4 | import { useAppState } from "../state/store";
 5 | 
 6 | export default function TaskStatus() {
 7 |   const { taskStatus, actionStatus } = useAppState((state) => ({
 8 |     taskStatus: state.currentTask.status,
 9 |     actionStatus: state.currentTask.actionStatus,
10 |   }));
11 | 
12 |   if (taskStatus !== "running") {
13 |     return null;
14 |   }
15 | 
16 |   const displayedStatus: Record<CurrentTaskSlice["actionStatus"], string> = {
17 |     idle: "💤 Idle",
18 |     "attaching-debugger": "🔗 Attaching Debugger",
19 |     "pulling-dom": "🌐 Understanding Website",
20 |     "annotating-page": "🌐 Understanding Website",
21 |     "fetching-knoweldge": "🧠 Getting Instructions",
22 |     "generating-action": "🤔 Thinking and planning",
23 |     "performing-action": "🚀 Performing Action",
24 |     waiting: "⏳ Waiting",
25 |   };
26 | 
27 |   return (
28 |     <Box textColor="gray.500" textAlign="center" mt={4} mb={-4} fontSize="sm">
29 |       {displayedStatus[actionStatus]}
30 |     </Box>
31 |   );
32 | }
33 | 


--------------------------------------------------------------------------------
/src/common/TaskUI.tsx:
--------------------------------------------------------------------------------
  1 | import React, { useCallback } from "react";
  2 | import {
  3 |   Button,
  4 |   Box,
  5 |   HStack,
  6 |   Spacer,
  7 |   useToast,
  8 |   Alert,
  9 |   AlertIcon,
 10 |   AlertDescription,
 11 | } from "@chakra-ui/react";
 12 | import { debugMode } from "../constants";
 13 | import { useAppState } from "../state/store";
 14 | import RunTaskButton from "./RunTaskButton";
 15 | import VoiceButton from "./VoiceButton";
 16 | import TaskHistory from "./TaskHistory";
 17 | import TaskStatus from "./TaskStatus";
 18 | import RecommendedTasks from "./RecommendedTasks";
 19 | import AutosizeTextarea from "./AutosizeTextarea";
 20 | 
 21 | const injectContentScript = async () => {
 22 |   const [tab] = await chrome.tabs.query({ currentWindow: true, active: true });
 23 |   if (!tab || !tab.id) {
 24 |     return;
 25 |   }
 26 | 
 27 |   await chrome.scripting.executeScript({
 28 |     target: { tabId: tab.id },
 29 |     files: ["src/pages/contentInjected/index.js"],
 30 |     world: "MAIN",
 31 |   });
 32 | };
 33 | 
 34 | function ActionExecutor() {
 35 |   const state = useAppState((state) => ({
 36 |     attachDebugger: state.currentTask.actions.attachDebugger,
 37 |     detachDegugger: state.currentTask.actions.detachDebugger,
 38 |     performActionString: state.currentTask.actions.performActionString,
 39 |     prepareLabels: state.currentTask.actions.prepareLabels,
 40 |     showImagePrompt: state.currentTask.actions.showImagePrompt,
 41 |   }));
 42 |   return (
 43 |     <Box mt={4}>
 44 |       <HStack
 45 |         columnGap="0.5rem"
 46 |         rowGap="0.5rem"
 47 |         fontSize="md"
 48 |         borderTop="1px dashed gray"
 49 |         py="3"
 50 |         shouldWrapChildren
 51 |         wrap="wrap"
 52 |       >
 53 |         <Button onClick={state.attachDebugger}>Attach</Button>
 54 |         <Button onClick={state.prepareLabels}>Prepare</Button>
 55 |         <Button onClick={state.showImagePrompt}>Show Image</Button>
 56 |         <Button
 57 |           onClick={() => {
 58 |             injectContentScript();
 59 |           }}
 60 |         >
 61 |           Inject
 62 |         </Button>
 63 |       </HStack>
 64 |     </Box>
 65 |   );
 66 | }
 67 | 
 68 | const TaskUI = () => {
 69 |   const state = useAppState((state) => ({
 70 |     taskHistory: state.currentTask.history,
 71 |     taskStatus: state.currentTask.status,
 72 |     runTask: state.currentTask.actions.runTask,
 73 |     instructions: state.ui.instructions,
 74 |     setInstructions: state.ui.actions.setInstructions,
 75 |     voiceMode: state.settings.voiceMode,
 76 |     isListening: state.currentTask.isListening,
 77 |   }));
 78 |   const taskInProgress = state.taskStatus === "running";
 79 | 
 80 |   const toast = useToast();
 81 | 
 82 |   const toastError = useCallback(
 83 |     (message: string) => {
 84 |       toast({
 85 |         title: "Error",
 86 |         description: message,
 87 |         status: "error",
 88 |         duration: 5000,
 89 |         isClosable: true,
 90 |       });
 91 |     },
 92 |     [toast],
 93 |   );
 94 | 
 95 |   const runTask = useCallback(() => {
 96 |     state.instructions && state.runTask(toastError);
 97 |   }, [state, toastError]);
 98 | 
 99 |   const runTaskWithNewInstructions = (newInstructions: string = "") => {
100 |     if (!newInstructions) {
101 |       return;
102 |     }
103 |     state.setInstructions(newInstructions);
104 |     state.runTask(toastError);
105 |   };
106 | 
107 |   const onKeyDown = (e: React.KeyboardEvent<HTMLTextAreaElement>) => {
108 |     if (e.key === "Enter" && e.shiftKey) {
109 |       e.preventDefault();
110 |       runTask();
111 |     }
112 |   };
113 | 
114 |   return (
115 |     <>
116 |       <AutosizeTextarea
117 |         // eslint-disable-next-line jsx-a11y/no-autofocus
118 |         autoFocus
119 |         placeholder="Try telling Fuji to do a task"
120 |         value={state.instructions || ""}
121 |         isDisabled={taskInProgress || state.isListening}
122 |         onChange={(e) => state.setInstructions(e.target.value)}
123 |         mb={2}
124 |         onKeyDown={onKeyDown}
125 |       />
126 |       <HStack mt={2} mb={2}>
127 |         <RunTaskButton runTask={runTask} />
128 |         {state.voiceMode && (
129 |           <VoiceButton
130 |             taskInProgress={taskInProgress}
131 |             onStopSpeaking={runTask}
132 |           />
133 |         )}
134 |         <Spacer />
135 |       </HStack>
136 |       {state.voiceMode && (
137 |         <Alert status="info" borderRadius="lg">
138 |           <AlertIcon />
139 |           <AlertDescription fontSize="sm" lineHeight="5">
140 |             In Voice Mode, you can press Space to start speaking and Space again
141 |             to stop. Fuji will run the task when you stop speaking. To turn off
142 |             Voice Mode, click the Setting icon in the top right corner.
143 |           </AlertDescription>
144 |         </Alert>
145 |       )}
146 |       {!state.voiceMode && !state.instructions && (
147 |         <RecommendedTasks runTask={runTaskWithNewInstructions} />
148 |       )}
149 |       {debugMode && <ActionExecutor />}
150 |       <TaskStatus />
151 |       <TaskHistory />
152 |     </>
153 |   );
154 | };
155 | 
156 | export default TaskUI;
157 | 


--------------------------------------------------------------------------------
/src/common/TokenCount.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import { Text } from "@chakra-ui/react";
 3 | import { countTokens } from "../helpers/countTokens";
 4 | import { useAsync } from "react-use";
 5 | import { useAppState } from "../state/store";
 6 | 
 7 | const TokenCount = ({ html }: { html: string }) => {
 8 |   const selectedModel = useAppState((state) => state.settings.selectedModel);
 9 | 
10 |   const numTokens =
11 |     useAsync(
12 |       () => countTokens(html, selectedModel as string),
13 |       [html, selectedModel],
14 |     ).value || null;
15 | 
16 |   let displayedCount = null;
17 |   if (!html) {
18 |     displayedCount = "Waiting for HTML";
19 |   } else if (numTokens === null) {
20 |     displayedCount = "Counting...";
21 |   } else {
22 |     displayedCount = numTokens + " tokens";
23 |   }
24 | 
25 |   return (
26 |     <>
27 |       <Text as="span" fontSize="sm" color="gray.500">
28 |         {displayedCount}
29 |       </Text>
30 |     </>
31 |   );
32 | };
33 | 
34 | export default TokenCount;
35 | 


--------------------------------------------------------------------------------
/src/common/VoiceButton.tsx:
--------------------------------------------------------------------------------
 1 | import { useEffect, useCallback } from "react";
 2 | import { Button, HStack, Icon } from "@chakra-ui/react";
 3 | import { BsPlayFill, BsStopFill } from "react-icons/bs";
 4 | import { useAppState } from "../state/store";
 5 | 
 6 | export default function VoiceButton({
 7 |   taskInProgress,
 8 |   onStopSpeaking,
 9 | }: {
10 |   taskInProgress: boolean;
11 |   onStopSpeaking: () => void;
12 | }) {
13 |   const state = useAppState((state) => ({
14 |     isListening: state.currentTask.isListening,
15 |     startListening: state.currentTask.actions.startListening,
16 |     stopListening: state.currentTask.actions.stopListening,
17 |   }));
18 | 
19 |   const toggleVoiceControl = useCallback(() => {
20 |     if (!taskInProgress) {
21 |       if (!state.isListening) {
22 |         state.startListening();
23 |       } else {
24 |         state.stopListening();
25 |         onStopSpeaking();
26 |       }
27 |     }
28 |   }, [state, taskInProgress, onStopSpeaking]);
29 | 
30 |   useEffect(() => {
31 |     if (!taskInProgress) {
32 |       const handleKeyDown = (event: KeyboardEvent) => {
33 |         if (event.code === "Space") {
34 |           event.preventDefault();
35 |           toggleVoiceControl();
36 |         }
37 |       };
38 | 
39 |       window.addEventListener("keydown", handleKeyDown);
40 |       return () => window.removeEventListener("keydown", handleKeyDown);
41 |     }
42 |   }, [taskInProgress, toggleVoiceControl]);
43 | 
44 |   const button = (
45 |     <Button
46 |       rightIcon={
47 |         <Icon as={state.isListening ? BsStopFill : BsPlayFill} boxSize={6} />
48 |       }
49 |       onClick={toggleVoiceControl}
50 |       colorScheme={state.isListening ? "red" : "blue"}
51 |       isDisabled={taskInProgress}
52 |     >
53 |       {state.isListening ? "Stop" : "Start"} Speaking
54 |     </Button>
55 |   );
56 | 
57 |   return <HStack alignItems="center">{button}</HStack>;
58 | }
59 | 


--------------------------------------------------------------------------------
/src/common/settings/AgentModeDropdown.tsx:
--------------------------------------------------------------------------------
 1 | import { Select } from "@chakra-ui/react";
 2 | import { useAppState } from "../../state/store";
 3 | import { AgentMode } from "../../helpers/aiSdkUtils";
 4 | import { enumValues } from "../../helpers/utils";
 5 | 
 6 | const DisplayName = {
 7 |   //   [AgentMode.Vision]: "Pure Vision",
 8 |   [AgentMode.VisionEnhanced]: "Vision Enhanced",
 9 |   [AgentMode.Text]: "Text",
10 | };
11 | 
12 | const AgentModeDrop = () => {
13 |   const { agentMode, updateSettings } = useAppState((state) => ({
14 |     agentMode: state.settings.agentMode,
15 |     updateSettings: state.settings.actions.update,
16 |   }));
17 | 
18 |   return (
19 |     <Select
20 |       id="agent-mode-select"
21 |       value={agentMode || ""}
22 |       onChange={(e) =>
23 |         updateSettings({ agentMode: e.target.value as AgentMode })
24 |       }
25 |     >
26 |       {enumValues(AgentMode).map((mode) => (
27 |         <option key={mode} value={mode}>
28 |           {DisplayName[mode]}
29 |         </option>
30 |       ))}
31 |     </Select>
32 |   );
33 | };
34 | 
35 | export default AgentModeDrop;
36 | 


--------------------------------------------------------------------------------
/src/common/settings/ModelDropdown.tsx:
--------------------------------------------------------------------------------
 1 | import { Select } from "@chakra-ui/react";
 2 | import { useAppState } from "../../state/store";
 3 | import {
 4 |   SupportedModels,
 5 |   DisplayName,
 6 |   isValidModelSettings,
 7 | } from "../../helpers/aiSdkUtils";
 8 | import { enumValues } from "../../helpers/utils";
 9 | 
/**
 * Dropdown for choosing the model. Options that `isValidModelSettings`
 * rejects for the current agent mode and API keys are shown disabled.
 */
const ModelDropdown = () => {
  const { selectedModel, agentMode, updateSettings } = useAppState((state) => ({
    selectedModel: state.settings.selectedModel,
    agentMode: state.settings.agentMode,
    updateSettings: state.settings.actions.update,
  }));

  const keys = useAppState((state) => ({
    openAIKey: state.settings.openAIKey,
    anthropicKey: state.settings.anthropicKey,
    geminiKey: state.settings.geminiKey,
  }));

  const modelOptions = enumValues(SupportedModels).map((model) => {
    const usable = isValidModelSettings(
      model,
      agentMode,
      keys.openAIKey,
      keys.anthropicKey,
      keys.geminiKey,
    );
    return (
      <option key={model} value={model} disabled={!usable}>
        {DisplayName[model]}
      </option>
    );
  });

  return (
    <Select
      id="model-select"
      value={selectedModel || ""}
      onChange={(event) => {
        updateSettings({
          selectedModel: event.target.value as SupportedModels,
        });
      }}
    >
      {modelOptions}
    </Select>
  );
};
51 | 
52 | export default ModelDropdown;
53 | 


--------------------------------------------------------------------------------
/src/common/settings/SetAPIKey.tsx:
--------------------------------------------------------------------------------
  1 | import {
  2 |   AbsoluteCenter,
  3 |   Box,
  4 |   Button,
  5 |   Divider,
  6 |   Input,
  7 |   VStack,
  8 |   Text,
  9 |   Link,
 10 |   HStack,
 11 |   FormControl,
 12 |   FormLabel,
 13 | } from "@chakra-ui/react";
 14 | import React from "react";
 15 | import { useAppState } from "../../state/store";
 16 | 
/** Props for the API-key settings form. Every prop is optional. */
type SetAPIKeyProps = {
  /**
   * Defaults to false. When true, a button that toggles the key inputs
   * between password and plain-text display is rendered beside the OpenAI
   * key input.
   */
  asInitializerView?: boolean;
  /** Initial value of the OpenAI key input; defaults to an empty string. */
  initialOpenAIKey?: string;
  /** Initial value of the Anthropic key state; defaults to an empty string. */
  initialAnthropicKey?: string;
  /** Initial value of the Gemini key state; defaults to an empty string. */
  initialGeminiKey?: string;
  /** Called, when provided, after the settings have been saved. */
  onClose?: () => void;
};
 24 | 
 25 | const SetAPIKey = ({
 26 |   asInitializerView = false,
 27 |   initialOpenAIKey = "",
 28 |   initialAnthropicKey = "",
 29 |   initialGeminiKey = "",
 30 |   onClose,
 31 | }: SetAPIKeyProps) => {
 32 |   const { updateSettings, initialOpenAIBaseUrl, initialAnthropicBaseUrl } =
 33 |     useAppState((state) => ({
 34 |       initialOpenAIBaseUrl: state.settings.openAIBaseUrl,
 35 |       initialAnthropicBaseUrl: state.settings.anthropicBaseUrl,
 36 |       updateSettings: state.settings.actions.update,
 37 |     }));
 38 | 
 39 |   const [openAIKey, setOpenAIKey] = React.useState(initialOpenAIKey || "");
 40 |   const [anthropicKey, setAnthropicKey] = React.useState(
 41 |     initialAnthropicKey || "",
 42 |   );
 43 |   const [geminiKey, setGeminiKey] = React.useState(initialGeminiKey || "");
 44 |   const [openAIBaseUrl, setOpenAIBaseUrl] = React.useState(
 45 |     initialOpenAIBaseUrl || "",
 46 |   );
 47 |   const [anthropicBaseUrl, setAnthropicBaseUrl] = React.useState(
 48 |     initialAnthropicBaseUrl || "",
 49 |   );
 50 | 
 51 |   const [showPassword, setShowPassword] = React.useState(false);
 52 | 
 53 |   const onSave = () => {
 54 |     updateSettings({
 55 |       openAIKey,
 56 |       openAIBaseUrl,
 57 |       anthropicKey,
 58 |       anthropicBaseUrl,
 59 |       geminiKey,
 60 |     });
 61 |     onClose && onClose();
 62 |   };
 63 | 
 64 |   return (
 65 |     <VStack spacing={4}>
 66 |       <Text fontSize="sm">
 67 |         You&rsquo;ll need an OpenAI or Anthropic API Key to run the Fuji in
 68 |         developer mode. If you don&rsquo;t already have one available, you can
 69 |         create one in your{" "}
 70 |         <Link
 71 |           href="https://platform.openai.com/account/api-keys"
 72 |           color="blue"
 73 |           isExternal
 74 |         >
 75 |           OpenAI account
 76 |         </Link>{" "}
 77 |         or your{" "}
 78 |         <Link
 79 |           href="https://console.anthropic.com/settings/keys"
 80 |           color="blue"
 81 |           isExternal
 82 |         >
 83 |           Anthropic account
 84 |         </Link>
 85 |         .
 86 |         <br />
 87 |         <br />
 88 |         Fuji stores your API keys locally on your device, and they are only used
 89 |         to communicate with the OpenAI API and/or the Anthropic API.
 90 |       </Text>
 91 |       <Box position="relative" py="2" w="full">
 92 |         <Divider />
 93 |         <AbsoluteCenter bg="white" px="4">
 94 |           OpenAI
 95 |         </AbsoluteCenter>
 96 |       </Box>
 97 |       <FormControl>
 98 |         <FormLabel>OpenAI API Key</FormLabel>
 99 |         <HStack w="full">
100 |           <Input
101 |             placeholder="Enter OpenAI API Key"
102 |             value={openAIKey}
103 |             onChange={(event) => setOpenAIKey(event.target.value)}
104 |             type={showPassword ? "text" : "password"}
105 |           />
106 |           {asInitializerView && (
107 |             <Button
108 |               onClick={() => setShowPassword(!showPassword)}
109 |               variant="outline"
110 |             >
111 |               {showPassword ? "Hide" : "Show"}
112 |             </Button>
113 |           )}
114 |         </HStack>
115 |       </FormControl>
116 |       {!asInitializerView && (
117 |         <FormControl>
118 |           <FormLabel>Base Url (optional)</FormLabel>
119 |           <Input
120 |             placeholder="Set Base Url"
121 |             value={openAIBaseUrl}
122 |             onChange={(event) => setOpenAIBaseUrl(event.target.value)}
123 |             type="text"
124 |           />
125 |         </FormControl>
126 |       )}
127 | 
128 |       <Box position="relative" py={2} w="full">
129 |         <Divider />
130 |         <AbsoluteCenter bg="white" px="4">
131 |           Anthropic
132 |         </AbsoluteCenter>
133 |       </Box>
134 |       <FormControl>
135 |         <FormLabel>Anthropic API Key</FormLabel>
136 |         <HStack w="full">
137 |           <Input
138 |             placeholder="Enter Anthropic API Key"
139 |             value={anthropicKey}
140 |             onChange={(event) => setAnthropicKey(event.target.value)}
141 |             type={showPassword ? "text" : "password"}
142 |           />
143 |           {asInitializerView && (
144 |             <Button
145 |               onClick={() => setShowPassword(!showPassword)}
146 |               variant="outline"
147 |             >
148 |               {showPassword ? "Hide" : "Show"}
149 |             </Button>
150 |           )}
151 |         </HStack>
152 |       </FormControl>
153 |       {!asInitializerView && (
154 |         <FormControl>
155 |           <FormLabel>Base Url (optional)</FormLabel>
156 |           <Input
157 |             placeholder="Set Base Url"
158 |             value={anthropicBaseUrl}
159 |             onChange={(event) => setAnthropicBaseUrl(event.target.value)}
160 |             type="text"
161 |           />
162 |         </FormControl>
163 |       )}
164 | 
165 |       <Box position="relative" py={2} w="full">
166 |         <Divider />
167 |         <AbsoluteCenter bg="white" px="4">
168 |           Gemini (Google)
169 |         </AbsoluteCenter>
170 |       </Box>
171 |       <FormControl>
172 |         <FormLabel>Gemini API Key</FormLabel>
173 |         <HStack w="full">
174 |           <Input
175 |             placeholder="Enter Gemini API Key"
176 |             value={geminiKey}
177 |             onChange={(event) => setGeminiKey(event.target.value)}
178 |             type={showPassword ? "text" : "password"}
179 |           />
180 |           {asInitializerView && (
181 |             <Button
182 |               onClick={() => setShowPassword(!showPassword)}
183 |               variant="outline"
184 |             >
185 |               {showPassword ? "Hide" : "Show"}
186 |             </Button>
187 |           )}
188 |         </HStack>
189 |       </FormControl>
190 | 
191 |       <Button
192 |         onClick={onSave}
193 |         w="full"
194 |         isDisabled={!openAIKey && !anthropicKey && !geminiKey}
195 |         colorScheme="blue"
196 |       >
197 |         Save
198 |       </Button>
199 |     </VStack>
200 |   );
201 | };
202 | 
203 | export default SetAPIKey;
204 | 


--------------------------------------------------------------------------------
/src/constants.ts:
--------------------------------------------------------------------------------
// Attribute-name constants shared across the extension. Their usage is not
// visible in this file; the names suggest they are DOM attribute names.
export const TAXY_ELEMENT_SELECTOR = "data-taxy-node-id";
export const VISIBLE_TEXT_ATTRIBUTE_NAME = "data-web-wand-visible-text";
export const ARIA_LABEL_ATTRIBUTE_NAME = "data-web-wand-aria-label";
export const WEB_WAND_LABEL_ATTRIBUTE_NAME = "data-web-wand-label";

// Read from the build-time environment: true only when VITE_DEBUG_MODE is
// exactly the string "true"; any other value (or none) yields false.
export const debugMode = import.meta.env.VITE_DEBUG_MODE === "true";
8 | 


--------------------------------------------------------------------------------
/src/environment.d.ts:
--------------------------------------------------------------------------------
// Augments the global NodeJS.ProcessEnv interface so that the two variables
// below are typed as strings wherever `process.env` is read.
declare global {
  namespace NodeJS {
    interface ProcessEnv {
      __DEV__: string;
      __FIREFOX__: string;
    }
  }
}

// The empty export makes this file a module, which `declare global` requires.
export {};
11 | 


--------------------------------------------------------------------------------
/src/global.d.ts:
--------------------------------------------------------------------------------
// Ambient declarations for virtual modules and non-code asset imports.

// Virtual module exposing `reloadOnUpdate(watchPath)` as both a named and the
// default export.
declare module "virtual:reload-on-update-in-background-script" {
  export const reloadOnUpdate: (watchPath: string) => void;
  export default reloadOnUpdate;
}

// Virtual module whose default export is `refreshOnUpdate(watchPath)`.
declare module "virtual:reload-on-update-in-view" {
  const refreshOnUpdate: (watchPath: string) => void;
  export default refreshOnUpdate;
}

// SVG imports: the default export is typed as a string and `ReactComponent`
// as a React component taking SVG props.
// NOTE(review): `React.SFC` is a deprecated alias in older @types/react and is
// believed to be absent from newer versions — confirm against the installed
// @types/react and switch to `React.FC` if needed.
declare module "*.svg" {
  import React = require("react");
  export const ReactComponent: React.SFC<React.SVGProps<SVGSVGElement>>;
  const src: string;
  export default src;
}

// JPG imports: default export typed as a string.
declare module "*.jpg" {
  const content: string;
  export default content;
}

// PNG imports: default export typed as a string.
declare module "*.png" {
  const content: string;
  export default content;
}

// JSON imports: default export typed as a string.
// NOTE(review): bundlers usually hand back the parsed value for JSON imports,
// so `string` may not match what is received at runtime — confirm.
declare module "*.json" {
  const content: string;
  export default content;
}
32 | 


--------------------------------------------------------------------------------
/src/helpers/browserUtils.ts:
--------------------------------------------------------------------------------
 1 | export async function findActiveTab(): Promise<chrome.tabs.Tab | null> {
 2 |   const currentWindow = await chrome.windows.getCurrent();
 3 |   if (!currentWindow || !currentWindow.id) {
 4 |     throw new Error("Could not find window");
 5 |   }
 6 |   const tabs = await chrome.tabs.query({
 7 |     active: true,
 8 |     windowId: currentWindow.id,
 9 |   });
10 |   const tab = tabs[0];
11 |   if (tab && tab.id != null) {
12 |     return tab;
13 |   }
14 |   return null;
15 | }
16 | 


--------------------------------------------------------------------------------
/src/helpers/buildAnnotatedScreenshots.ts:
--------------------------------------------------------------------------------
 1 | import { sleep } from "./utils";
 2 | import { callRPCWithTab } from "./rpc/pageRPC";
 3 | import mergeImages from "@src/shared/images/mergeScreenshots";
 4 | import { type LabelData } from "../pages/content/drawLabels";
 5 | import { type Knowledge } from "./knowledge";
 6 | 
 7 | export default async function buildAnnotatedScreenshots(
 8 |   tabId: number,
 9 |   knowledge: Knowledge,
10 | ): Promise<[string, LabelData[]]> {
11 |   const imgDataRaw = await chrome.tabs.captureVisibleTab({
12 |     format: "png",
13 |   });
14 |   const labelData = await callRPCWithTab(tabId, "drawLabels", [knowledge]);
15 |   await sleep(300);
16 |   const imgDataAnnotated = await chrome.tabs.captureVisibleTab({
17 |     format: "png",
18 |   });
19 |   const imgData = await mergeImages([
20 |     { src: imgDataRaw, caption: "Clean Screenshot" },
21 |     { src: imgDataAnnotated, caption: "Annotated Screenshot" },
22 |   ]);
23 |   await sleep(300);
24 |   await callRPCWithTab(tabId, "removeLabels", []);
25 | 
26 |   return [imgData, labelData];
27 | }
28 | 


--------------------------------------------------------------------------------
/src/helpers/chromeDebugger.ts:
--------------------------------------------------------------------------------
 1 | // Not sure why but this won't work properly if running inside a devtools panel
 2 | // a lot of tabs are shown as attached to debugger when they are not
 3 | // export async function isDebuggerAttached(tabId: number) {
 4 | //   const targets = await chrome.debugger.getTargets();
 5 | //   console.log(targets);
 6 | //   return targets.some((target) => target.tabId === tabId && target.attached);
 7 | // }
 8 | 
// Module-level bookkeeping used instead of the commented-out
// isDebuggerAttached() query above.
// Ids of the tabs this module has attached the debugger to.
const attachedTabs = new Set<number>();
// Guards setUpDetachListener() so its listeners are registered only once.
let detachListenerSetUp = false;
12 | 
/**
 * Registers, at most once, the listeners that keep `attachedTabs` in sync:
 * a tab is forgotten when it is closed or when the debugger detaches from it.
 */
function setUpDetachListener() {
  if (!detachListenerSetUp) {
    detachListenerSetUp = true;

    chrome.tabs.onRemoved.addListener((closedTabId) => {
      // Deleting an id that is not tracked is a no-op.
      attachedTabs.delete(closedTabId);
    });

    chrome.debugger.onDetach.addListener(({ tabId }) => {
      if (tabId) {
        attachedTabs.delete(tabId);
      }
    });
  }
}
28 | 
/**
 * Attaches the Chrome debugger (protocol version "1.3") to a tab and enables
 * the DOM and Runtime domains on it.
 *
 * Resolves immediately when this module already tracks the tab as attached.
 * Rejects when attaching fails or when enabling either domain fails; the tab
 * is only recorded in `attachedTabs` after both domains are enabled.
 *
 * @param tabId Id of the tab to attach to.
 */
export async function attachDebugger(tabId: number) {
  setUpDetachListener();
  console.log("start attachDebugger");
  if (attachedTabs.has(tabId)) {
    console.log("already attached to debugger", tabId);
    return;
  }
  return new Promise<void>((resolve, reject) => {
    chrome.debugger.attach({ tabId }, "1.3", () => {
      // Read lastError once, synchronously inside the callback.
      const attachError = chrome.runtime.lastError;
      if (attachError) {
        console.error("Failed to attach debugger:", attachError.message);
        reject(new Error(`Failed to attach debugger: ${attachError.message}`));
        return;
      }
      console.log("attached to debugger");

      // The domain setup is asynchronous. Its failures must be routed to
      // `reject`; otherwise the promise returned to the caller never settles.
      const enableDomains = async () => {
        await chrome.debugger.sendCommand({ tabId }, "DOM.enable");
        console.log("DOM enabled");
        await chrome.debugger.sendCommand({ tabId }, "Runtime.enable");
        console.log("Runtime enabled");
      };

      enableDomains().then(
        () => {
          attachedTabs.add(tabId);
          resolve();
        },
        (error: unknown) => {
          console.error("Failed to enable debugger domains:", error);
          reject(error instanceof Error ? error : new Error(String(error)));
        },
      );
    });
  });
}
62 | 
/**
 * Stops tracking a tab and detaches the debugger from it.
 *
 * Detaching is best-effort: the call is awaited so callers (for example
 * `detachAllDebuggers`) really wait for it, and a failure is logged instead of
 * surfacing as an unhandled promise rejection.
 *
 * @param tabId Id of the tab to detach from.
 */
export async function detachDebugger(tabId: number) {
  attachedTabs.delete(tabId);
  try {
    await chrome.debugger.detach({ tabId });
  } catch (error) {
    console.warn("Failed to detach debugger from tab", tabId, error);
  }
}
67 | 
/** Detaches the debugger from every tracked tab, one tab at a time. */
export async function detachAllDebuggers() {
  // Walk the live Set iterator; detachDebugger removes each id as it goes.
  const tracked = attachedTabs.values();
  for (let step = tracked.next(); !step.done; step = tracked.next()) {
    await detachDebugger(step.value);
  }
}
73 | 


--------------------------------------------------------------------------------
/src/helpers/countTokens.ts:
--------------------------------------------------------------------------------
 1 | export const countTokens = async (text: string, model_name: string) => {
 2 |   const response = await fetch("https://tiktoken-api.vercel.app/token_count", {
 3 |     method: "POST",
 4 |     headers: {
 5 |       "Content-Type": "application/json",
 6 |     },
 7 |     body: JSON.stringify({
 8 |       text,
 9 |       model_name,
10 |     }),
11 |   });
12 |   const data = await response.json();
13 |   return data.token_count;
14 | };
15 | 


--------------------------------------------------------------------------------
/src/helpers/disableExtensions.ts:
--------------------------------------------------------------------------------
// These are extensions that are known to interfere with the operation of Taxy.
// We'll turn them off temporarily while Taxy is performing actions.
// Entries are Chrome extension ids; the comment above each id names the
// extension it belongs to.
const incompatibleExtensions = [
  // Dashlane
  "fdjamakpfbbddfjaooikfcpapjohcfmg",
  // LastPass
  "hdokiejnpimakedhajhdlcegeplioahd",
];

// Per-extension-id counter of how many times this module has disabled the
// extension without re-enabling it yet. reenableExtensions() only re-enables
// an extension when its counter is exactly 1.
const disableCounts: Record<string, number> = {};
11 | 
/**
 * Disables every installed extension listed in `incompatibleExtensions` and
 * records one "hold" per call in `disableCounts`.
 *
 * - An extension that is currently enabled is disabled; the hold is recorded
 *   only if disabling succeeded.
 * - An extension that is already disabled *by this module* (its count is
 *   positive) gets an additional hold, so overlapping sessions keep it
 *   disabled until the last one has finished.
 * - An extension that is disabled for any other reason (count is zero or
 *   missing) is left untouched and will not be re-enabled later.
 *
 * The returned promise settles after all disable requests have completed.
 * Failures to disable an individual extension are logged, not thrown.
 *
 * @throws The `chrome.runtime.lastError` value when listing extensions fails.
 */
export const disableIncompatibleExtensions = async () => {
  const installedBlacklistedExtensions = await new Promise<
    chrome.management.ExtensionInfo[]
  >((resolve, reject) => {
    chrome.management.getAll((extensions) => {
      if (chrome.runtime.lastError) {
        console.error(
          "Failed to get extensions:",
          chrome.runtime.lastError.message,
        );
        reject(chrome.runtime.lastError);
      } else {
        resolve(
          extensions.filter(
            (extension) =>
              extension.type === "extension" &&
              incompatibleExtensions.includes(extension.id),
          ),
        );
      }
    });
  });

  for (const extension of installedBlacklistedExtensions) {
    const currentCount = disableCounts[extension.id] || 0;

    if (!extension.enabled) {
      // Already off. Only count it if we were the ones who turned it off.
      if (currentCount > 0) {
        disableCounts[extension.id] = currentCount + 1;
      }
      continue;
    }

    await new Promise<void>((resolve) => {
      chrome.management.setEnabled(extension.id, false, () => {
        if (chrome.runtime.lastError) {
          console.error(
            `Failed to disable extension ${extension.id}:`,
            chrome.runtime.lastError.message,
          );
        } else {
          // Re-read the counter: another session may have changed it while
          // this request was in flight.
          disableCounts[extension.id] = (disableCounts[extension.id] || 0) + 1;
        }
        resolve();
      });
    });
  }
};
48 | 
/**
 * Releases one hold on every currently-disabled extension listed in
 * `incompatibleExtensions`.
 *
 * If we have multiple sessions running and have disabled an extension
 * multiple times (count > 1), only the counter is decremented; the extension
 * is re-enabled once the last session releases it (count === 1). Extensions
 * with no recorded count are left alone.
 *
 * A failure to re-enable one extension keeps its counter so a later call can
 * retry, and does not prevent the remaining extensions from being processed.
 *
 * @throws The `chrome.runtime.lastError` value when listing extensions fails,
 *   or the first such value raised while re-enabling an extension.
 */
export const reenableExtensions = async () => {
  const disabledBlacklistedExtensions = await new Promise<
    chrome.management.ExtensionInfo[]
  >((resolve, reject) => {
    chrome.management.getAll((extensions) => {
      if (chrome.runtime.lastError) {
        console.error(
          "Failed to get extensions:",
          chrome.runtime.lastError.message,
        );
        reject(chrome.runtime.lastError);
      } else {
        resolve(
          extensions.filter(
            (extension) =>
              extension.type === "extension" &&
              !extension.enabled &&
              incompatibleExtensions.includes(extension.id),
          ),
        );
      }
    });
  });

  const failures: unknown[] = [];

  for (const extension of disabledBlacklistedExtensions) {
    const count = disableCounts[extension.id];
    if (count > 1) {
      disableCounts[extension.id] = count - 1;
      continue;
    }
    if (count !== 1) {
      // Not disabled by us; leave it as the user had it.
      continue;
    }

    try {
      await new Promise<void>((resolve, reject) => {
        chrome.management.setEnabled(extension.id, true, () => {
          const enableError = chrome.runtime.lastError;
          if (enableError) {
            console.error(
              `Failed to enable extension ${extension.id}:`,
              enableError.message,
            );
            reject(enableError);
            return;
          }
          delete disableCounts[extension.id];
          resolve();
        });
      });
    } catch (error) {
      failures.push(error);
    }
  }

  if (failures.length > 0) {
    throw failures[0];
  }
};
96 | 


--------------------------------------------------------------------------------
/src/helpers/dom-agent/availableActions.ts:
--------------------------------------------------------------------------------
// Actions that take no arguments. They are spread into `availableActions`
// below. `as const` keeps the names as literal types.
const commonActions = [
  {
    name: "wait",
    description:
      "Wait for 3 seconds before the next action. Useful when the page is loading.",
    args: [],
  },
  {
    name: "finish",
    description: "Indicate the task is finished",
    args: [],
  },
  {
    name: "fail",
    description: "Indicate that you are unable to complete the task",
    args: [],
  },
] as const;
19 | 
// Complete list of actions: the element-targeting actions declared here
// followed by `commonActions`. Each entry has a name, a human-readable
// description and an ordered list of `{ name, type }` argument descriptors.
// `as const` keeps names and types literal so the types below can be derived.
export const availableActions = [
  {
    name: "click",
    description: "Click on an element",
    args: [
      {
        name: "elementId",
        type: "string",
      },
    ],
  },
  {
    name: "setValue",
    description: "Focus on and sets the value of an input element",
    args: [
      {
        name: "elementId",
        type: "string",
      },
      {
        name: "value",
        type: "string",
      },
    ],
  },
  ...commonActions,
] as const;
47 | 
// Union of the element types of `availableActions`.
type AvailableAction = (typeof availableActions)[number];

// Turns a list of `{ name, type }` descriptors into an object type keyed by
// argument name. An argument whose declared type is "number" maps to
// `number`; every other declared type maps to `string`.
type ArgsToObject<T extends ReadonlyArray<{ name: string; type: string }>> = {
  [K in T[number]["name"]]: Extract<
    T[number],
    { name: K }
  >["type"] extends "number"
    ? number
    : string;
};

// Shape of one concrete action: its literal name plus its arguments as an
// object derived from the action's argument descriptors.
export type ActionShape<
  T extends {
    name: string;
    args: ReadonlyArray<{ name: string; type: string }>;
  },
> = {
  name: T["name"];
  args: ArgsToObject<T["args"]>;
};

// Union of `ActionShape` over every entry of `availableActions`, built by
// mapping each action name to its shape and indexing by all names.
export type ActionPayload = {
  [K in AvailableAction["name"]]: ActionShape<
    Extract<AvailableAction, { name: K }>
  >;
}[AvailableAction["name"]];
74 | 


--------------------------------------------------------------------------------
/src/helpers/dom-agent/determineNextAction.ts:
--------------------------------------------------------------------------------
  1 | import { useAppState } from "../../state/store";
  2 | import { availableActions } from "./availableActions";
  3 | import { ParsedResponseSuccess, parseResponse } from "./parseResponse";
  4 | import { QueryResult } from "../vision-agent/determineNextAction";
  5 | import errorChecker from "../errorChecker";
  6 | import { fetchResponseFromModel } from "../aiSdkUtils";
  7 | 
// The `action` member of a non-null vision-agent QueryResult. This module
// reads its `thought` and `operation` fields.
type Action = NonNullable<QueryResult>["action"];
  9 | 
 10 | const formattedActions = availableActions
 11 |   .map((action, i) => {
 12 |     const args = action.args
 13 |       .map((arg) => `${arg.name}: ${arg.type}`)
 14 |       .join(", ");
 15 |     return `${i + 1}. ${action.name}(${args}): ${action.description}`;
 16 |   })
 17 |   .join("\n");
 18 | 
 19 | const systemMessage = `
 20 | You are a browser automation assistant.
 21 | 
 22 | You can use the following tools:
 23 | 
 24 | ${formattedActions}
 25 | 
 26 | You will be given a task to perform and the current state of the DOM.
 27 | You will also be given previous actions that you have taken. You may retry a failed action up to one time.
 28 | 
 29 | There are two examples of actions:
 30 | 
 31 | Example 1:
 32 | {
 33 |   thought: "I am clicking the add to cart button",
 34 |   action: "click(223)"
 35 | }
 36 | 
 37 | Example 2:
 38 | {
 39 |   thought: "I am typing 'fish food' into the search bar",
 40 |   action: "setValue(123, 'fish food')"
 41 | }
 42 | 
 43 | Example 3:
 44 | {
 45 |   thought: "I continue to scroll down to find the section",
 46 |   action: "scroll('down')"
 47 | }
 48 | 
 49 | Your response must always be in JSON format and must include "thought" and "action".
 50 | When finish, use "finish()" in "action" and include a brief summary of the task in "thought".
 51 | `;
 52 | 
 53 | export async function determineNextAction(
 54 |   taskInstructions: string,
 55 |   previousActions: Action[],
 56 |   simplifiedDOM: string,
 57 |   maxAttempts = 3,
 58 |   notifyError?: (error: string) => void,
 59 | ): Promise<QueryResult> {
 60 |   const model = useAppState.getState().settings.selectedModel;
 61 |   const prompt = formatPrompt(taskInstructions, previousActions, simplifiedDOM);
 62 | 
 63 |   for (let i = 0; i < maxAttempts; i++) {
 64 |     try {
 65 |       const completion = await fetchResponseFromModel(model, {
 66 |         systemMessage,
 67 |         prompt,
 68 |         jsonMode: true,
 69 |       });
 70 | 
 71 |       const rawResponse = completion.rawResponse;
 72 | 
 73 |       try {
 74 |         const parsed = await parseResponse(rawResponse);
 75 |         if ("error" in parsed) {
 76 |           throw new Error(parsed.error);
 77 |         }
 78 |         return {
 79 |           usage: completion.usage,
 80 |           prompt,
 81 |           rawResponse,
 82 |           // TODO: refactor dom agent so we don't need this
 83 |           action: visionActionAdapter(parsed),
 84 |         };
 85 |       } catch (e) {
 86 |         console.error("Failed to parse response", e);
 87 |       }
 88 |       // eslint-disable-next-line @typescript-eslint/no-explicit-any
 89 |     } catch (error: any) {
 90 |       if (error instanceof Error) {
 91 |         const recoverable = errorChecker(error, notifyError);
 92 |         if (!recoverable) {
 93 |           throw error;
 94 |         }
 95 |       } else {
 96 |         console.error("Unexpected determineNextAction error:");
 97 |         console.error(error);
 98 |       }
 99 |     }
100 |   }
101 |   const errMsg = `Failed to complete query after ${maxAttempts} attempts. Please try again later.`;
102 |   if (notifyError) {
103 |     notifyError(errMsg);
104 |   }
105 |   throw new Error(errMsg);
106 | }
107 | 
/**
 * Builds the user prompt sent to the model.
 *
 * The prompt contains, in order: the task, the previously taken actions (only
 * when there are any), the current local time and — when `pageContents` is a
 * non-empty string — the page contents.
 *
 * @param taskInstructions The task as requested by the user.
 * @param previousActions Actions already taken; each contributes its thought
 *   and its JSON-serialized operation.
 * @param pageContents Optional page contents appended at the end.
 * @returns The assembled prompt text.
 */
export function formatPrompt(
  taskInstructions: string,
  previousActions: Action[],
  pageContents?: string,
) {
  const historyEntries: string[] = [];
  for (const { thought, operation } of previousActions) {
    historyEntries.push(
      `Thought: ${thought}\nAction:${JSON.stringify(operation)}`,
    );
  }
  const historySection =
    historyEntries.length > 0
      ? `You have already taken the following actions: \n${historyEntries.join(
          "\n\n",
        )}\n\n`
      : "";

  // Joined with "\n"; the empty entries produce the blank separator lines and
  // the final one produces the trailing newline.
  const prompt = [
    "The user requests the following task:",
    "",
    `${taskInstructions}`,
    "",
    historySection,
    "",
    `Current time: ${new Date().toLocaleString()}`,
    "",
  ].join("\n");

  if (!pageContents) {
    return prompt;
  }
  return `${prompt}\nCurrent page contents:\n${pageContents}`;
}
142 | 
// Converts a parsed DOM-agent response into the vision agent's action shape:
// the arguments are copied and a `uid` argument is added, set to `elementId`
// when the action has one and to "" otherwise.
// TODO: refactor dom agent so we don't need this
function visionActionAdapter(action: ParsedResponseSuccess): Action {
  const { thought, parsedAction } = action;
  const sourceArgs = parsedAction.args;
  const uid = "elementId" in sourceArgs ? sourceArgs.elementId : "";
  const operation = {
    name: parsedAction.name,
    args: { ...sourceArgs, uid },
  };
  return { thought, operation: operation as Action["operation"] };
}
158 | 


--------------------------------------------------------------------------------
/src/helpers/dom-agent/parseResponse.ts:
--------------------------------------------------------------------------------
  1 | import { ActionPayload, availableActions } from "./availableActions";
  2 | 
// A successfully parsed model response.
export type ParsedResponseSuccess = {
  // The model's stated reasoning.
  thought: string;
  // The raw action string as returned by the model, e.g. "click(223)".
  action: string;
  // The action string resolved against `availableActions`.
  parsedAction: ActionPayload;
};

// Result of parseResponse(): either a success or an object carrying a
// human-readable validation error.
export type ParsedResponse =
  | ParsedResponseSuccess
  | {
      error: string;
    };
 14 | 
 15 | // sometimes AI replies with a JSON wrapped in triple backticks
 16 | export function extractJsonFromMarkdown(input: string): string[] {
 17 |   // Create a regular expression to capture code wrapped in triple backticks
 18 |   const regex = /```(json)?\s*([\s\S]*?)\s*```/g;
 19 | 
 20 |   const results = [];
 21 |   let match;
 22 |   while ((match = regex.exec(input)) !== null) {
 23 |     // If 'json' is specified, add the content to the results array
 24 |     if (match[1] === "json") {
 25 |       results.push(match[2]);
 26 |     } else if (match[2].startsWith("{")) {
 27 |       results.push(match[2]);
 28 |     }
 29 |   }
 30 |   return results;
 31 | }
 32 | 
 33 | function parseFunctionCall(callString: string) {
 34 |   // First, match the function name and the arguments part
 35 |   const functionPattern = /(\w+)\(([\s\S]*)\)/;
 36 |   const matches = callString.match(functionPattern);
 37 | 
 38 |   if (!matches) {
 39 |     console.error("Input does not match a function call pattern.", callString);
 40 |     throw new Error("Input does not match a function call pattern.");
 41 |   }
 42 | 
 43 |   const [, name, argsPart] = matches;
 44 | 
 45 |   // Then, match the arguments inside the args part
 46 |   // This pattern looks for either strings (handling escaped quotes) or numbers as arguments
 47 |   const argsPattern = /(["'])(?:(?=(\\?))\2[\s\S])*?\1|\d+/g;
 48 |   const argsMatches = argsPart.match(argsPattern);
 49 | 
 50 |   // Process matched arguments to strip quotes and unescape characters
 51 |   const args = argsMatches
 52 |     ? argsMatches.map((arg: string) => {
 53 |         // Remove leading and trailing quotes if they exist and unescape characters
 54 |         if (
 55 |           (arg.startsWith(`"`) && arg.endsWith(`"`)) ||
 56 |           (arg.startsWith(`'`) && arg.endsWith(`'`))
 57 |         ) {
 58 |           arg = arg.slice(1, -1);
 59 |           return arg
 60 |             .replace(/\\'/g, `'`)
 61 |             .replace(/\\"/g, `"`)
 62 |             .replace(/\\\\/g, `\\`);
 63 |         }
 64 |         // Parse numbers directly
 65 |         return JSON.parse(arg);
 66 |       })
 67 |     : [];
 68 | 
 69 |   return { name, args };
 70 | }
 71 | 
 72 | export function parseResponse(text: string): ParsedResponse {
 73 |   let action;
 74 |   try {
 75 |     action = JSON.parse(text);
 76 |   } catch (_e) {
 77 |     try {
 78 |       action = JSON.parse(extractJsonFromMarkdown(text)[0]);
 79 |     } catch (_e) {
 80 |       throw new Error("Response does not contain valid JSON.");
 81 |     }
 82 |   }
 83 | 
 84 |   if (!action.thought) {
 85 |     return {
 86 |       error: "Invalid response: Thought not found in the model response.",
 87 |     };
 88 |   }
 89 | 
 90 |   if (!action.action) {
 91 |     return {
 92 |       error: "Invalid response: Action not found in the model response.",
 93 |     };
 94 |   }
 95 | 
 96 |   const thought = action.thought;
 97 |   const actionString = action.action;
 98 | 
 99 |   const { name: actionName, args: argsArray } = parseFunctionCall(actionString);
100 |   console.log(actionName, argsArray);
101 | 
102 |   const availableAction = availableActions.find(
103 |     (action) => action.name === actionName,
104 |   );
105 | 
106 |   if (!availableAction) {
107 |     return {
108 |       error: `Invalid action: "${actionName}" is not a valid action.`,
109 |     };
110 |   }
111 |   const parsedArgs: Record<string, number | string> = {};
112 | 
113 |   if (argsArray.length !== availableAction.args.length) {
114 |     return {
115 |       error: `Invalid number of arguments: Expected ${availableAction.args.length} for action "${actionName}", but got ${argsArray.length}.`,
116 |     };
117 |   }
118 | 
119 |   for (let i = 0; i < argsArray.length; i++) {
120 |     const arg = argsArray[i];
121 |     const expectedArg = availableAction.args[i];
122 | 
123 |     parsedArgs[expectedArg.name] = arg;
124 | 
125 |     // TODO: type-parsing is currently disabled because all our args are strings
126 |     // if (expectedArg.type === 'number') {
127 |     //   const numberValue = Number(arg);
128 | 
129 |     //   if (isNaN(numberValue)) {
130 |     //     return {
131 |     //       error: `Invalid argument type: Expected a number for argument "${expectedArg.name}", but got "${arg}".`,
132 |     //     };
133 |     //   }
134 | 
135 |     //   parsedArgs[expectedArg.name] = numberValue;
136 |     // } else if (expectedArg.type === 'string') {
137 |     //   parsedArgs[expectedArg.name] = arg;
138 |     // } else {
139 |     //   return {
140 |     //     // @ts-expect-error this is here to make sure we don't forget to update this code if we add a new arg type
141 |     //     error: `Invalid argument type: Unknown type "${expectedArg.type}" for argument "${expectedArg.name}".`,
142 |     //   };
143 |     // }
144 |   }
145 | 
146 |   const parsedAction = {
147 |     name: availableAction.name,
148 |     args: parsedArgs,
149 |   } as ActionPayload;
150 | 
151 |   return {
152 |     thought,
153 |     action: actionString,
154 |     parsedAction,
155 |   };
156 | }
157 | 


--------------------------------------------------------------------------------
/src/helpers/errorChecker.ts:
--------------------------------------------------------------------------------
 1 | import Anthropic from "@anthropic-ai/sdk";
 2 | import OpenAI from "openai";
 3 | import { debugMode } from "../constants";
 4 | 
 5 | // returns true if the error is recoverable by retrying the query
 6 | export default function errorChecker(
 7 |   err: Error,
 8 |   notifyError?: (errMsg: string) => void,
 9 | ): boolean {
10 |   const log = (msg: string, e: Error) => {
11 |     if (debugMode) {
12 |       console.error(msg, e);
13 |     }
14 |     if (notifyError) {
15 |       notifyError(msg);
16 |     }
17 |   };
18 |   if (err instanceof OpenAI.APIError) {
19 |     if (err instanceof OpenAI.InternalServerError) {
20 |       log(
21 |         "There is a problem with the OpenAI API server. Please check its status page https://status.openai.com/ and try again later.",
22 |         err,
23 |       );
24 |       return false;
25 |     }
26 |     if (
27 |       err instanceof OpenAI.AuthenticationError ||
28 |       err instanceof OpenAI.PermissionDeniedError
29 |     ) {
30 |       log("The OpenAI API key you provided might not be valid", err);
31 |       return false;
32 |     }
33 |     if (err instanceof OpenAI.APIConnectionError) {
34 |       log(
35 |         "There is a problem with the network connection to the OpenAI API. Please check your network connection and try again later.",
36 |         err,
37 |       );
38 |       return true;
39 |     }
40 |     // other API errors are not recoverable
41 |     return false;
42 |   } else if (err instanceof Anthropic.APIError) {
43 |     if (err instanceof Anthropic.InternalServerError) {
44 |       log(
45 |         "There is a problem with the Anthropic API server. Please check its status page https://status.anthropic.com/ and try again later.",
46 |         err,
47 |       );
48 |       return false;
49 |     }
50 |     if (
51 |       err instanceof Anthropic.AuthenticationError ||
52 |       err instanceof Anthropic.PermissionDeniedError
53 |     ) {
54 |       log("The Anthropic API key you provided might not be valid", err);
55 |       return false;
56 |     }
57 |     if (err instanceof Anthropic.APIConnectionError) {
58 |       log(
59 |         "There is a problem with the network connection to the Anthropic API. Please check your network connection and try again later.",
60 |         err,
61 |       );
62 |       return true;
63 |     }
64 |     // other API errors are not recoverable
65 |     return false;
66 |   }
67 |   log("Error: " + err.message, err);
68 |   // retry everything else (e.g. network errors, syntax error, timeout)
69 |   return true;
70 | }
71 | 


--------------------------------------------------------------------------------
/src/helpers/index.ts:
--------------------------------------------------------------------------------
1 | import { type ToolOperation } from "./vision-agent/tools";
2 | export { ToolOperation };
3 | export { DomActions } from "./rpc/domActions";
4 | export { callRPC, callRPCWithTab } from "./rpc/pageRPC";
5 | export { attachDebugger, detachDebugger } from "./chromeDebugger";
6 | import { operateTool, operateToolWithSelector } from "./rpc/performAction";
7 | export { operateTool, operateToolWithSelector };
8 | 


--------------------------------------------------------------------------------
/src/helpers/knowledge/db.json:
--------------------------------------------------------------------------------
  1 | {
  2 |   "x.com": {
  3 |     "rules": [
  4 |       {
  5 |         "regexes": [".*"],
  6 |         "knowledge": {
  7 |           "notes": [
  8 |             "The website X (formerly Twitter) is a social media platform. Many people still call it Twitter and use the term \"tweet\" to refer to a post.",
  9 |             "Do not confuse \"post\" with \"message\". A post is a public message that can be seen by anyone, while a message is a private message that can only be seen by the recipient."
 10 |           ]
 11 |         }
 12 |       },
 13 |       {
 14 |         "regexes": ["^/compose/post/?$"],
 15 |         "knowledge": {
 16 |           "notes": [
 17 |             "The \"Add post\" button is used to compose a thread. Do not confuse with the \"Post\" button that sends the composed tweet."
 18 |           ]
 19 |         }
 20 |       }
 21 |     ]
 22 |   },
 23 |   "calendar.google.com": {
 24 |     "rules": [
 25 |       {
 26 |         "regexes": [".*"],
 27 |         "knowledge": {
 28 |           "notes": [
 29 |             "The best way to create a new event on Google Calendar is to click on the \"Create\" button, then click on the \"Event\" option, then fill in the details in the form, and click on the \"Save\" button."
 30 |           ],
 31 |           "annotationRules": [
 32 |             {
 33 |               "selector": "[data-key]",
 34 |               "useAttributeAsName": "data-key",
 35 |               "allowInvisible": false,
 36 |               "allowCovered": true,
 37 |               "allowAriaHidden": false
 38 |             },
 39 |             {
 40 |               "selector": "[data-hovercard-id]",
 41 |               "useAttributeAsName": "data-hovercard-id",
 42 |               "allowInvisible": false,
 43 |               "allowCovered": false,
 44 |               "allowAriaHidden": false
 45 |             }
 46 |           ]
 47 |         }
 48 |       }
 49 |     ]
 50 |   },
 51 |   "airbnb.com": {
 52 |     "rules": [
 53 |       {
 54 |         "regexes": [".*"],
 55 |         "knowledge": {
 56 |           "annotationRules": [
 57 |             {
 58 |               "selector": "[data-testid=\"listing-card-title\"]",
 59 |               "allowInvisible": false,
 60 |               "allowCovered": true,
 61 |               "allowAriaHidden": true
 62 |             }
 63 |           ]
 64 |         }
 65 |       }
 66 |     ]
 67 |   },
 68 |   "amazon.com": {
 69 |     "rules": [
 70 |       {
 71 |         "regexes": [".*"],
 72 |         "knowledge": {
 73 |           "notes": [
 74 |             "Be careful not to confuse the \"Add to Cart\" with the \"Buy Now\". The \"Add to Cart\" button adds the item to the cart, while the \"Buy Now\" button takes you to the checkout page.",
 75 |             "Do not confuse \"Buy Now\" and \"Buy New\" on product page.",
 76 |             "You should always verify if the product is in stock before buying or adding to the cart. If the product is not in stock, you should notify the user about it."
 77 |           ]
 78 |         }
 79 |       },
 80 |       {
 81 |         "regexes": ["^/s$"],
 82 |         "knowledge": {
 83 |           "notes": [
 84 |             "There is no \"Add to Cart\" button on the search results page. You need to click on the product name to go to the product details page first."
 85 |           ]
 86 |         }
 87 |       }
 88 |     ]
 89 |   },
 90 |   "github.com": {
 91 |     "rules": [
 92 |       {
 93 |         "regexes": [
 94 |           ".*"
 95 |         ],
 96 |         "knowledge": {
 97 |           "notes": [
 98 |             "You can open the account menu by clicking the user's avatar on the top right. You can find and manage current user's profile, repositories, projects, organizations, etc. in the menu.",
 99 |             "To invite a member to an organization or a team, you need to first click \"Invite member\" or \"Invite someone\". When you see the dialog, type in the input to search by username or email, then click the button appear under the input that says \"[name] invite to [org]\". Please note that this does not actually send the invite: it only adds the user to the selection. You must then click the green \"Invite\" button to send the invitation."
100 |           ]
101 |         }
102 |       }
103 |     ]
104 |   }
105 | }
106 | 


--------------------------------------------------------------------------------
/src/helpers/knowledge/index.ts:
--------------------------------------------------------------------------------
  1 | import _db from "./db.json" assert { type: "json" };
  2 | import _redirects from "./redirects.json" assert { type: "json" };
  3 | 
// Maps a host name to the host whose knowledge should also be consulted
// (looked up by getNormalizedHosts).
type Redirects = {
  [host: string]: string;
};
// Describes one kind of element to annotate on a page.
export type AnnotationRule = {
  // selector identifying the elements; rules with an empty selector are
  // dropped when knowledge is merged
  selector: string;
  // NOTE(review): the naming/visibility flags below are consumed outside this
  // file; their exact semantics are not visible here — confirm before relying on them
  useStaticName?: string;
  useAttributeAsName?: string;
  allowInvisible?: boolean;
  allowAriaHidden?: boolean;
  allowCovered?: boolean;
};

// Knowledge attached to a matching page: free-text notes and annotation rules.
export type Knowledge = {
  notes?: string[];
  annotationRules?: AnnotationRule[];
};

// A rule applies its knowledge when one of `regexes` matches the page's
// pathname (tested case-insensitively in mergeKnowledge).
export type Rule = {
  regexes: string[];
  knowledge: Knowledge;
};

// Knowledge base keyed by host name.
export type Data = {
  [host: string]: {
    rules?: Rule[];
  };
};

// rule type used only in editing mode
export type EditingRule = Rule & {
  regexType: string;
};

// data type used only in editing mode
export type EditingData = {
  host: string;
  rules: EditingRule[];
};

// The parts of a page location that fetchKnowledge needs.
export type LocationInfo = {
  host: string;
  pathname: string;
};
 47 | 
 48 | export function fetchKnowledge(
 49 |   location: LocationInfo,
 50 |   customKnowledgeBase?: Data,
 51 | ): Knowledge {
 52 |   // TODO: fetch from a server
 53 |   const data = _db as Data;
 54 |   const redirects = _redirects as Redirects;
 55 |   let result: Knowledge = {
 56 |     notes: [],
 57 |     annotationRules: [],
 58 |   };
 59 | 
 60 |   const { host, pathname } = location;
 61 |   const normalizedHosts = getNormalizedHosts(host, redirects);
 62 | 
 63 |   for (const searchHost of normalizedHosts) {
 64 |     const hostKnowledge = data[searchHost] || customKnowledgeBase?.[searchHost];
 65 |     if (hostKnowledge) {
 66 |       result = mergeKnowledge(result, hostKnowledge, pathname);
 67 |     }
 68 |   }
 69 | 
 70 |   return result;
 71 | }
 72 | 
 73 | function getNormalizedHosts(host: string, redirects: Redirects): string[] {
 74 |   const hostWithWww = host.startsWith("www.") ? host : `www.${host}`;
 75 |   const hostWithoutWww = host.startsWith("www.") ? host.slice(4) : host;
 76 |   const redirectedHostWithWww = redirects[hostWithWww] || hostWithWww;
 77 |   const redirectedHostWithoutWww = redirects[hostWithoutWww] || hostWithoutWww;
 78 |   return [
 79 |     ...new Set([
 80 |       hostWithWww,
 81 |       hostWithoutWww,
 82 |       redirectedHostWithWww,
 83 |       redirectedHostWithoutWww,
 84 |     ]),
 85 |   ];
 86 | }
 87 | 
 88 | function mergeKnowledge(
 89 |   result: Knowledge,
 90 |   dataSource: { rules?: Rule[] },
 91 |   pathname: string,
 92 | ): Knowledge {
 93 |   const rules = dataSource.rules;
 94 |   if (rules != null) {
 95 |     for (const rule of rules) {
 96 |       for (const regex of rule.regexes) {
 97 |         if (new RegExp(regex, "i").test(pathname)) {
 98 |           // merge all matching rules
 99 |           result.notes = result.notes?.concat(rule.knowledge.notes ?? []);
100 | 
101 |           // filter out invalid annotaion rules
102 |           const filteredAnnotationRules =
103 |             rule.knowledge.annotationRules?.filter(
104 |               (rule) => rule.selector !== "",
105 |             ) ?? [];
106 |           result.annotationRules = result.annotationRules?.concat(
107 |             filteredAnnotationRules,
108 |           );
109 |         }
110 |       }
111 |     }
112 |   }
113 |   return result;
114 | }
115 | 
/** Returns the bundled (default) knowledge base as loaded from db.json. */
export function fetchAllDefaultKnowledge(): Data {
  const bundled = _db as Data;
  return bundled;
}
119 | 


--------------------------------------------------------------------------------
/src/helpers/knowledge/redirects.json:
--------------------------------------------------------------------------------
1 | {
2 |   "twitter.com": "x.com",
3 |   "www.twitter.com": "x.com",
4 |   "www.x.com": "x.com",
5 |   "www.airbnb.com": "airbnb.com",
6 |   "www.amazon.com": "amazon.com"
7 | }
8 | 


--------------------------------------------------------------------------------
/src/helpers/rpc/pageRPC.ts:
--------------------------------------------------------------------------------
 1 | import { sleep } from "../utils";
 2 | import type { RPCMethods } from "../../pages/content/domOperations";
 3 | 
 4 | // Call these functions to execute code in the content script
 5 | 
 6 | function sendMessage<K extends keyof RPCMethods>(
 7 |   tabId: number,
 8 |   method: K,
 9 |   payload: Parameters<RPCMethods[K]>,
10 | ): Promise<ReturnType<RPCMethods[K]>> {
11 |   // Send a message to the other world
12 |   // Ensure that the method and arguments are correct according to RpcMethods
13 |   return new Promise((resolve, reject) => {
14 |     chrome.tabs.sendMessage(tabId, { method, payload }, (response) => {
15 |       if (chrome.runtime.lastError) {
16 |         reject(chrome.runtime.lastError);
17 |       } else {
18 |         resolve(response);
19 |       }
20 |     });
21 |   });
22 | }
23 | 
/**
 * Calls an RPC method on the active tab of the current window.
 *
 * If the active tab's URL starts with "chrome" (e.g. an extension page), the
 * first non-active tab of the current window is used instead, which is
 * useful for testing.
 *
 * @param method - name of the RPC method
 * @param payload - argument tuple for that method
 * @param maxTries - number of attempts forwarded to callRPCWithTab
 * @throws Error("No active tab found") when no usable tab with an id exists
 */
export const callRPC = async <K extends keyof RPCMethods>(
  method: K,
  payload: Parameters<RPCMethods[K]>,
  maxTries = 1,
): Promise<ReturnType<RPCMethods[K]>> => {
  let [activeTab] = await chrome.tabs.query({
    active: true,
    currentWindow: true,
  });

  // If the active tab is a chrome-extension:// page, then we need to get some random other tab for testing.
  // `activeTab` may be undefined when the query returns no tabs, hence `?.`.
  if (activeTab?.url?.startsWith("chrome")) {
    [activeTab] = await chrome.tabs.query({
      active: false,
      currentWindow: true,
    });
  }

  if (!activeTab?.id) throw new Error("No active tab found");
  return callRPCWithTab(activeTab.id, method, payload, maxTries);
};
41 | 
/**
 * Calls an RPC method on a specific tab, retrying on failure.
 *
 * Each failed attempt except the last is logged and followed by a one-second
 * pause (the content script may not have loaded yet). After the final failed
 * attempt the error from that attempt is thrown.
 *
 * @param tabId - id of the tab to message
 * @param method - name of the RPC method
 * @param payload - argument tuple for that method
 * @param maxTries - total number of attempts
 */
export const callRPCWithTab = async <K extends keyof RPCMethods>(
  tabId: number,
  method: K,
  payload: Parameters<RPCMethods[K]>,
  maxTries = 2,
): Promise<ReturnType<RPCMethods[K]>> => {
  let lastError: unknown;
  for (let attempt = 1; attempt <= maxTries; attempt++) {
    try {
      return await sendMessage(tabId, method, payload);
    } catch (e) {
      lastError = e;
      if (attempt < maxTries) {
        // Content script may not have loaded, retry
        console.error(e);
        await sleep(1000);
      }
    }
  }
  // Every attempt failed: surface the error from the final one
  throw lastError;
};
67 | 


--------------------------------------------------------------------------------
/src/helpers/rpc/performAction.ts:
--------------------------------------------------------------------------------
  1 | import { DomActions } from "./domActions";
  2 | import {
  3 |   WEB_WAND_LABEL_ATTRIBUTE_NAME,
  4 |   VISIBLE_TEXT_ATTRIBUTE_NAME,
  5 | } from "../../constants";
  6 | import { sleep } from "../utils";
  7 | import { type ToolOperation } from "../vision-agent/tools";
  8 | 
  9 | function getSelector(label: string): string {
 10 |   return `[${WEB_WAND_LABEL_ATTRIBUTE_NAME}="${label}"]`;
 11 | }
 12 | 
 13 | function getFallbackSelector(selectorName: string): string {
 14 |   return `[${VISIBLE_TEXT_ATTRIBUTE_NAME}="${selectorName}"]`;
 15 | }
 16 | 
 17 | export async function clickWithSelector(
 18 |   domActions: DomActions,
 19 |   selector: string,
 20 | ): Promise<boolean> {
 21 |   console.log("clickWithSelector", selector);
 22 |   return await domActions.clickWithSelector({
 23 |     selector,
 24 |   });
 25 | }
 26 | 
 27 | export async function clickWithElementId(
 28 |   domActions: DomActions,
 29 |   elementId: string,
 30 | ): Promise<boolean> {
 31 |   console.log("clickWithElementId", elementId);
 32 |   return await domActions.clickWithElementId({
 33 |     elementId: parseInt(elementId),
 34 |   });
 35 | }
 36 | 
 37 | export async function clickWithLabel(
 38 |   domActions: DomActions,
 39 |   label: string,
 40 | ): Promise<boolean> {
 41 |   console.log("clickWithLabel", label);
 42 |   let success = false;
 43 |   try {
 44 |     success = await domActions.clickWithSelector({
 45 |       selector: `#${label}`,
 46 |     });
 47 |   } catch (e) {
 48 |     // `#${selectorName}` might not be valid
 49 |   }
 50 |   if (success) return true;
 51 |   success = await domActions.clickWithSelector({
 52 |     selector: getSelector(label),
 53 |   });
 54 |   if (success) return true;
 55 |   return await domActions.clickWithSelector({
 56 |     selector: getFallbackSelector(label),
 57 |   });
 58 | }
 59 | 
 60 | export async function setValueWithSelector(
 61 |   domActions: DomActions,
 62 |   selector: string,
 63 |   value: string,
 64 | ): Promise<boolean> {
 65 |   console.log("setValueWithSelector", selector);
 66 |   return await domActions.setValueWithSelector({
 67 |     selector,
 68 |     value,
 69 |   });
 70 | }
 71 | 
 72 | export async function setValueWithElementId(
 73 |   domActions: DomActions,
 74 |   elementId: string,
 75 |   value: string,
 76 | ): Promise<boolean> {
 77 |   console.log("setValueWithElementId", elementId);
 78 |   return await domActions.setValueWithElementId({
 79 |     elementId: parseInt(elementId),
 80 |     value,
 81 |   });
 82 | }
 83 | 
 84 | export async function setValueWithLabel(
 85 |   domActions: DomActions,
 86 |   label: string,
 87 |   value: string,
 88 | ): Promise<boolean> {
 89 |   console.log("setValueWithLabel", label);
 90 |   let success = false;
 91 |   try {
 92 |     success = await domActions.setValueWithSelector({
 93 |       selector: `#${label}`,
 94 |       value,
 95 |     });
 96 |   } catch (e) {
 97 |     // `#${selectorName}` might not be valid
 98 |   }
 99 |   if (success) return true;
100 |   success = await domActions.setValueWithSelector({
101 |     selector: getSelector(label),
102 |     value,
103 |   });
104 |   if (success) return true;
105 |   return await domActions.setValueWithSelector({
106 |     selector: getFallbackSelector(label),
107 |     value,
108 |   });
109 | }
110 | 
/**
 * Scrolls the page according to `value`: "up", "down", "top" or "bottom".
 * Any other value is reported with console.error and otherwise ignored.
 */
export async function scroll(domActions: DomActions, value: string) {
  if (value === "up") {
    await domActions.scrollUp();
  } else if (value === "down") {
    await domActions.scrollDown();
  } else if (value === "top") {
    await domActions.scrollToTop();
  } else if (value === "bottom") {
    await domActions.scrollToBottom();
  } else {
    console.error("Invalid scroll value", value);
  }
}
129 | 
/**
 * Builds a function that executes a single ToolOperation against a tab.
 *
 * How elements are located is injected by the caller: `click` and `setValue`
 * receive the operation's `uid` and decide what it means (label, element id,
 * selector, ...). The remaining operations are handled here:
 *   - scroll: delegated to scroll()
 *   - wait: pauses for three seconds
 *   - finish / fail: only logged
 *   - navigate: opens the url in a new window/tab via window.open
 *   - setValueAndEnter: same as setValue with "\n" appended to the value
 * A failed click/setValue is reported with console.error, not thrown.
 */
function createOperateTool(
  click: (domActions: DomActions, label: string) => Promise<boolean>,
  setValue: (
    domActions: DomActions,
    label: string,
    value: string,
  ) => Promise<boolean>,
): (tabId: number, action: ToolOperation) => Promise<void> {
  const reportMissingElement = (uid: string) => {
    console.error("Unable to find element with uid: ", uid);
  };

  return async (tabId: number, action: ToolOperation) => {
    const domActions = new DomActions(tabId);
    console.log("operateTool", action);

    switch (action.name) {
      case "click": {
        const clicked = await click(domActions, action.args.uid);
        if (!clicked) reportMissingElement(action.args.uid);
        return;
      }
      case "setValue":
      case "setValueAndEnter": {
        // the "enter" variant submits by appending a newline to the text
        const suffix = action.name === "setValueAndEnter" ? "\n" : "";
        const written = await setValue(
          domActions,
          action.args.uid,
          (action.args.value || "") + suffix,
        );
        if (!written) reportMissingElement(action.args.uid);
        return;
      }
      case "scroll":
        await scroll(domActions, action.args.value);
        return;
      case "wait":
        await sleep(3000);
        return;
      case "navigate":
        console.log("Navigate to new page", action.args.url);
        window.open(action.args.url, "_blank");
        return;
      case "finish":
        console.log("Action finished successfully.");
        return;
      case "fail":
        console.warn("Action failed.");
        return;
      default:
        console.error("Invalid action name", action);
    }
  };
}
192 | 
// Operates on elements addressed by label: clickWithLabel / setValueWithLabel
// try `#label`, then the label attribute, then the visible-text attribute.
export const operateTool = createOperateTool(clickWithLabel, setValueWithLabel);

// DOM agent currently uses this (using elementId instead of label)
export const operateToolWithSimpliedDom = createOperateTool(
  clickWithElementId,
  setValueWithElementId,
);

// Variant that passes the operation's uid to DomActions as a selector string.
export const operateToolWithSelector = createOperateTool(
  clickWithSelector,
  setValueWithSelector,
);
205 | 


--------------------------------------------------------------------------------
/src/helpers/rpc/runtimeFunctionStrings.ts:
--------------------------------------------------------------------------------
// Function whose source text is exported below. It calls scrollIntoView on
// `this`, centering the target both vertically and horizontally.
// It is never called directly in this file; it is serialized with toString(),
// so any edit inside the body changes the exported string.
// NOTE(review): presumably the string is evaluated in the page with `this`
// bound to a DOM element — confirm against the caller.
function scrollIntoViewFunction() {
  // @ts-expect-error this is run in the browser context
  this.scrollIntoView({
    block: "center",
    inline: "center",
    // behavior: 'smooth',
  });
}
// Source text of scrollIntoViewFunction, for use where a function must be
// passed as a string
export const scrollScriptString = scrollIntoViewFunction.toString();
12 | 


--------------------------------------------------------------------------------
/src/helpers/rpc/utils.ts:
--------------------------------------------------------------------------------
 1 | import { DomActions } from "./domActions";
 2 | 
 3 | export async function waitTillHTMLRendered(
 4 |   tabId: number,
 5 |   interval = undefined,
 6 |   timeout = undefined,
 7 | ) {
 8 |   const domActions = new DomActions(tabId);
 9 |   return await domActions.waitTillHTMLRendered(interval, timeout);
10 | }
11 | 


--------------------------------------------------------------------------------
/src/helpers/shrinkHTML/tagsSelfClose.ts:
--------------------------------------------------------------------------------
/**
 * Shortens markup by rewriting every element that has no content at all
 * (`<tag attrs></tag>`) into the self-closing form `<tag attrs />`.
 * Only tag names made of letters are recognised; matching is case-insensitive.
 */
export const tagsSelfClose = (html: string) => {
  // group 1: tag name, group 2: everything between the name and ">"
  const emptyElement = /<([a-z]+)([^<]*?)><\/\1>/gi;
  return html.replace(
    emptyElement,
    (_whole: string, tagName: string, attributes: string) =>
      `<${tagName}${attributes} />`,
  );
};
9 | 


--------------------------------------------------------------------------------
/src/helpers/shrinkHTML/templatize.test.ts:
--------------------------------------------------------------------------------
 1 | import { test } from "@jest/globals";
 2 | import templatize from "./templatize";
 3 | 
 4 | const sample = `
 5 | <body>
 6 | <div>
 7 | <a id="1242"></a>
 8 | <div>
 9 |   <div>
10 |     Lopez Island, Washington On the beach Sep 17 – 22 $350 per night
11 |     <span aria-label="5.0 out of 5 average rating"></span>
12 |   </div>
13 |   <div>
14 |     <button
15 |       aria-label="Add to wishlist: Lopez Island, Washington"
16 |       type="button"
17 |       id="1272"
18 |     ></button>
19 |     <div aria-label="Photo 1 of 6"></div>
20 |   </div>
21 | </div>
22 | </div>
23 | <div>
24 | <a id="1366"></a>
25 | <div>
26 |   <div>
27 |     Brinnon, Washington On the beach Apr 22 – 28 $317 per night
28 |     <span aria-label="4.97 out of 5 average rating"></span>
29 |   </div>
30 |   <div>
31 |     <button
32 |       aria-label="Add to wishlist: Brinnon, Washington"
33 |       type="button"
34 |       id="1396"
35 |     ></button>
36 |     <div aria-label="Photo 1 of 6"></div>
37 |   </div>
38 | </div>
39 | </div>
40 | <div>
41 | <a id="1490"></a>
42 | <div>
43 |   <div>
44 |     Lopez Island, Washington On the beach Aug 8 – 14 $534 per night
45 |     <span aria-label="4.9 out of 5 average rating"></span>
46 |   </div>
47 |   <div>
48 |     <button
49 |       aria-label="Add to wishlist: Lopez Island, Washington"
50 |       type="button"
51 |       id="1520"
52 |     ></button>
53 |     <div aria-label="Photo 1 of 6"></div>
54 |   </div>
55 | </div>
56 | </div>
57 | <div>
58 | <a id="1614"></a>
59 | <div>
60 |   <div>
61 |     Camano, Washington On the beach Jun 1 – 6 $910 per night
62 |     <span aria-label="4.72 out of 5 average rating"></span>
63 |   </div>
64 |   <div>
65 |     <button
66 |       aria-label="Add to wishlist: Camano, Washington"
67 |       type="button"
68 |       id="1644"
69 |     ></button>
70 |     <div aria-label="Photo 1 of 6"></div>
71 |   </div>
72 | </div>
73 | </body>
74 | `;
75 | 
76 | // test('templatize', () => {
77 | //   const out = templatize(sample);
78 | //   console.log('in length', sample.length);
79 | //   console.log('out length', out.length);
80 | //   console.log(out);
81 | //   expect(templatize(sample)).toBe(``);
82 | // });
83 | 
// Smoke test: runs templatize on the sample markup and prints the result.
// It contains no assertion, so it only fails if templatize throws.
test("templatize", () => {
  // const dom = new DOMParser().parseFromString(sample, 'text/html');

  const out = templatize(sample);
  // const out = templatize(dom.documentElement);
  console.log(out);
});
91 | 


--------------------------------------------------------------------------------
/src/helpers/simplifyDom.ts:
--------------------------------------------------------------------------------
 1 | import { callRPC } from "./rpc/pageRPC";
 2 | import { truthyFilter } from "./utils";
 3 | 
 4 | export async function getSimplifiedDom() {
 5 |   const fullDom = await callRPC("getAnnotatedDOM", [], 3);
 6 |   if (!fullDom || typeof fullDom !== "string") return null;
 7 | 
 8 |   const dom = new DOMParser().parseFromString(fullDom, "text/html");
 9 | 
10 |   // Mount the DOM to the document in an iframe so we can use getComputedStyle
11 | 
12 |   const interactiveElements: HTMLElement[] = [];
13 | 
14 |   const simplifiedDom = generateSimplifiedDom(
15 |     dom.documentElement,
16 |     interactiveElements,
17 |   ) as HTMLElement;
18 | 
19 |   return simplifiedDom;
20 | }
21 | 
/**
 * Recursively builds a reduced copy of an annotated DOM subtree.
 *
 * Rules, in order:
 *   - a text node with non-blank content becomes a new text node (content plus a trailing space);
 *   - anything that is neither an HTML nor an SVG element is dropped;
 *   - elements whose `data-visible` attribute is not "true" are dropped;
 *   - children are simplified first; text directly under BODY is discarded;
 *   - an element is kept when it is interactive (`data-interactive="true"` or
 *     has a `role`) or labelled (`aria-label` or `name`); otherwise it is
 *     dropped if it has no surviving children, or replaced by its only child;
 *   - a kept element is recreated with a whitelist of attributes; interactive
 *     ones also receive `id` copied from `data-id` and are appended to
 *     `interactiveElements` (children before their parent).
 *
 * @param element - node to simplify
 * @param interactiveElements - output list, mutated in place
 * @returns the simplified node, or null if nothing of it survives
 */
export function generateSimplifiedDom(
  element: ChildNode,
  interactiveElements: HTMLElement[],
): ChildNode | null {
  if (element.nodeType === Node.TEXT_NODE && element.textContent?.trim()) {
    return document.createTextNode(element.textContent + " ");
  }

  if (!(element instanceof HTMLElement) && !(element instanceof SVGElement)) {
    return null;
  }

  if (element.getAttribute("data-visible") !== "true") return null;

  const simplifiedChildren: ChildNode[] = [];
  for (const child of Array.from(element.childNodes)) {
    const simplified = generateSimplifiedDom(child, interactiveElements);
    if (simplified) simplifiedChildren.push(simplified);
  }

  // Don't bother with text that is the direct child of the body
  const children =
    element.tagName === "BODY"
      ? simplifiedChildren.filter((node) => node.nodeType !== Node.TEXT_NODE)
      : simplifiedChildren;

  const interactive =
    element.getAttribute("data-interactive") === "true" ||
    element.hasAttribute("role");
  const labelled =
    element.hasAttribute("aria-label") || element.hasAttribute("name");

  if (!interactive && !labelled) {
    // A plain wrapper adds nothing: drop it or collapse it into its only child
    if (children.length === 0) return null;
    if (children.length === 1) return children[0];
  }

  const container = document.createElement(element.tagName);

  const allowedAttributes = [
    "aria-label",
    "data-name",
    "name",
    "type",
    "placeholder",
    "value",
    "role",
    "title",
  ];
  allowedAttributes
    .filter((attr) => element.hasAttribute(attr))
    .forEach((attr) => {
      container.setAttribute(attr, element.getAttribute(attr) as string);
    });

  if (interactive) {
    interactiveElements.push(element as HTMLElement);
    container.setAttribute("id", element.getAttribute("data-id") as string);
  }

  for (const child of children) {
    container.appendChild(child);
  }

  return container;
}
83 | 


--------------------------------------------------------------------------------
/src/helpers/utils.ts:
--------------------------------------------------------------------------------
 1 | export async function sleep(ms: number) {
 2 |   return new Promise((resolve) => setTimeout(resolve, ms));
 3 | }
 4 | 
 5 | export function truthyFilter<T>(value: T | null | undefined): value is T {
 6 |   return Boolean(value);
 7 | }
 8 | 
 9 | export async function waitFor(
10 |   predicate: () => Promise<boolean>,
11 |   interval: number,
12 |   _maxChecks: number,
13 |   rejectOnTimeout = true,
14 | ): Promise<void> {
15 |   // special case for 0 maxChecks (wait forever)
16 |   const maxChecks = _maxChecks === 0 ? Infinity : _maxChecks;
17 |   let checkCount = 0;
18 |   return new Promise((resolve, reject) => {
19 |     const intervalId = setInterval(async () => {
20 |       if (await predicate()) {
21 |         clearInterval(intervalId);
22 |         resolve();
23 |       } else {
24 |         checkCount++;
25 |         if (checkCount >= maxChecks) {
26 |           clearInterval(intervalId);
27 |           if (rejectOnTimeout) {
28 |             reject(new Error("Timed out waiting for condition"));
29 |           } else {
30 |             resolve();
31 |           }
32 |         }
33 |       }
34 |     }, interval);
35 |   });
36 | }
37 | 
/**
 * Waits until the value reported by `getSize` stops changing.
 *
 * The size is sampled every `interval` milliseconds. It counts as stable once
 * a non-zero size has been seen unchanged on three consecutive samples; any
 * change (or a previous size of 0) resets the count. At most
 * `timeout / interval` samples are taken.
 *
 * @param getSize - async probe returning the current size
 * @param interval - sampling interval in milliseconds
 * @param timeout - overall budget in milliseconds
 * @param rejectOnTimeout - reject when the budget runs out; by default the
 *   size is simply assumed stable and the promise resolves
 */
export async function waitTillStable(
  getSize: () => Promise<number>,
  interval: number,
  timeout: number,
  rejectOnTimeout = false, // default to assuming stable after timeout
): Promise<void> {
  const requiredStableSamples = 3;
  let previousSize = 0;
  let stableSamples = 0;

  const sizeHasSettled = async (): Promise<boolean> => {
    const currentSize = await getSize();

    console.log("last: ", previousSize, " <> curr: ", currentSize);

    const unchanged = previousSize != 0 && currentSize === previousSize;
    // any change starts the count over
    stableSamples = unchanged ? stableSamples + 1 : 0;

    if (stableSamples >= requiredStableSamples) {
      console.log("Size stable! Assume fully rendered..");
      return true;
    }

    previousSize = currentSize;
    return false;
  };

  return waitFor(sizeHasSettled, interval, timeout / interval, rejectOnTimeout);
}
73 | 
/**
 * Returns the own enumerable string keys of `obj`, typed as keys of `obj`.
 * This is Object.keys with a narrower static type.
 */
export function enumKeys<O extends object, K extends keyof O = keyof O>(
  obj: O,
): K[] {
  const names = Object.keys(obj);
  return names as K[];
}

/**
 * Returns the values of `obj` in the same order as enumKeys(obj).
 */
export function enumValues<O extends object>(obj: O): O[keyof O][] {
  const values: O[keyof O][] = [];
  for (const key of enumKeys(obj)) {
    values.push(obj[key]);
  }
  return values;
}
83 | 


--------------------------------------------------------------------------------
/src/helpers/vision-agent/determineNavigateAction.ts:
--------------------------------------------------------------------------------
  1 | import { parseResponse } from "./parseResponse";
  2 | import { QueryResult } from "./determineNextAction";
  3 | import { useAppState } from "../../state/store";
  4 | import errorChecker from "../errorChecker";
  5 | import { fetchResponseFromModel } from "../aiSdkUtils";
  6 | 
  7 | import { schemaToDescription, navigateSchema } from "./tools";
  8 | 
  9 | const navigateSchemaDescription = schemaToDescription(navigateSchema);
 10 | 
 11 | const systemMessage = (voiceMode: boolean) => `
 12 | You are a browser automation assistant.
 13 | 
 14 | You can use the following tool:
 15 | 
 16 | ${navigateSchemaDescription}
 17 | 
 18 | You will have access to more tools as you progress through the task.
 19 | 
 20 | You will be given a task to perform.
 21 | This is an example of expected response from you:
 22 | 
 23 | {
 24 |   "thought": "To find latest news on AI, I am navigating to Google.",${
 25 |     voiceMode
 26 |       ? `,
 27 |   "speak": "To find the latest news on AI, I am navigating to Google."`
 28 |       : ""
 29 |   }
 30 |   "action": {
 31 |     "name": "navigate",
 32 |     "args": {
 33 |       "url": "https://www.google.com/"
 34 |     }
 35 |   }
 36 | }
 37 | 
 38 | Your response must always be in JSON format and must include string "thought"${
 39 |   voiceMode ? ', string "speak",' : ""
 40 | } and object "action", which contains the string "name" of tool of choice, and necessary arguments ("args") if required by the tool.
 41 | `;
 42 | 
 43 | export async function determineNavigateAction(
 44 |   taskInstructions: string,
 45 |   maxAttempts = 3,
 46 |   notifyError?: (error: string) => void,
 47 | ): Promise<QueryResult> {
 48 |   const model = useAppState.getState().settings.selectedModel;
 49 |   const voiceMode = useAppState.getState().settings.voiceMode;
 50 |   const prompt = formatPrompt(taskInstructions);
 51 | 
 52 |   for (let i = 0; i < maxAttempts; i++) {
 53 |     try {
 54 |       const completion = await fetchResponseFromModel(model, {
 55 |         systemMessage: systemMessage(voiceMode),
 56 |         prompt,
 57 |         jsonMode: true,
 58 |       });
 59 | 
 60 |       const rawResponse = completion.rawResponse;
 61 |       let action = null;
 62 |       try {
 63 |         action = parseResponse(rawResponse);
 64 |       } catch (e) {
 65 |         console.error(e);
 66 |         // TODO: try use LLM to fix format when response is not valid
 67 |         throw new Error(`Incorrectly formatted response: ${e}`);
 68 |       }
 69 | 
 70 |       return {
 71 |         usage: completion.usage,
 72 |         prompt,
 73 |         rawResponse,
 74 |         action,
 75 |       };
 76 |       // eslint-disable-next-line @typescript-eslint/no-explicit-any
 77 |     } catch (error: any) {
 78 |       if (error instanceof Error) {
 79 |         const recoverable = errorChecker(error, notifyError);
 80 |         if (!recoverable) {
 81 |           throw error;
 82 |         }
 83 |       } else {
 84 |         console.error("Unexpected determineNextAction error:");
 85 |         console.error(error);
 86 |       }
 87 |     }
 88 |   }
 89 |   const errMsg = `Failed to complete query after ${maxAttempts} attempts. Please try again later.`;
 90 |   if (notifyError) {
 91 |     notifyError(errMsg);
 92 |   }
 93 |   throw new Error(errMsg);
 94 | }
 95 | 
 96 | export function formatPrompt(taskInstructions: string) {
 97 |   return `The user requests the following task:
 98 | 
 99 | ${taskInstructions}
100 | 
101 | Current time: ${new Date().toLocaleString()}
102 | `;
103 | }
104 | 


--------------------------------------------------------------------------------
/src/helpers/vision-agent/parseResponse.ts:
--------------------------------------------------------------------------------
 1 | import { toolSchemaUnion, type ToolOperation } from "./tools";
 2 | import { fromError } from "zod-validation-error";
 3 | 
 4 | export type Action = {
 5 |   thought: string;
 6 |   speak?: string;
 7 |   operation: ToolOperation;
 8 | };
 9 | 
/**
 * Collects the contents of triple-backtick code fences that look like JSON.
 * Models sometimes wrap their JSON reply in a markdown code fence.
 *
 * A fence is kept when it is tagged `json`, or when it is untagged and its
 * content starts with `{`.
 *
 * @param input - Raw text that may contain fenced code blocks.
 * @returns The kept fence contents, in order of appearance.
 */
export function extractJsonFromMarkdown(input: string): string[] {
  // Group 1: optional "json" tag. Group 2: fence content without the
  // surrounding whitespace.
  const fencePattern = /```(json)?\s*([\s\S]*?)\s*```/g;
  const jsonBlocks: string[] = [];

  for (
    let fence = fencePattern.exec(input);
    fence !== null;
    fence = fencePattern.exec(input)
  ) {
    const [, languageTag, content] = fence;
    if (languageTag === "json" || content.startsWith("{")) {
      jsonBlocks.push(content);
    }
  }
  return jsonBlocks;
}
27 | 
/**
 * Parses a raw model response into an {@link Action}.
 *
 * The response is parsed as JSON directly; if that fails, the first JSON-like
 * markdown code fence in the text is tried instead. The parsed value must
 * carry non-null `thought` and `action` fields, and `action` must validate
 * against `toolSchemaUnion`.
 *
 * @param rawResponse - The text returned by the model.
 * @returns The parsed action; `speak` is included only when the response
 *   contains that key.
 * @throws Error when no valid JSON is found, when `thought` or `action` is
 *   missing, or when `action` fails schema validation.
 */
export function parseResponse(rawResponse: string): Action {
  let response;
  try {
    response = JSON.parse(rawResponse);
  } catch (_e) {
    try {
      response = JSON.parse(extractJsonFromMarkdown(rawResponse)[0]);
    } catch (_e) {
      throw new Error("Response does not contain valid JSON.");
    }
  }
  // Optional chaining keeps a JSON `null` response on the validation-error
  // path instead of raising a TypeError on property access.
  if (response?.thought == null || response?.action == null) {
    throw new Error("Invalid response: Thought and Action are required");
  }
  let operation;
  try {
    operation = toolSchemaUnion.parse(response.action);
  } catch (err) {
    const validationError = fromError(err);
    // user friendly error message
    throw new Error(validationError.toString());
  }
  if ("speak" in response) {
    return {
      thought: response.thought,
      speak: response.speak,
      operation,
    };
  } else {
    return {
      thought: response.thought,
      operation,
    };
  }
}
63 | 


--------------------------------------------------------------------------------
/src/helpers/vision-agent/tools.ts:
--------------------------------------------------------------------------------
  1 | import { z } from "zod";
  2 | 
  3 | export const clickSchema = z.object({
  4 |   name: z.literal("click"),
  5 |   description: z
  6 |     .literal("Click on an element with the uid on the annotation.")
  7 |     .optional(),
  8 |   args: z.object({
  9 |     uid: z.string(),
 10 |   }),
 11 | });
 12 | 
 13 | export const setValueSchema = z.object({
 14 |   name: z.literal("setValue"),
 15 |   description: z
 16 |     .literal(
 17 |       "Focus on and set the value of an input element with the uid on the annotation.",
 18 |     )
 19 |     .optional(),
 20 |   args: z.object({
 21 |     uid: z.string(),
 22 |     value: z.string(),
 23 |   }),
 24 | });
 25 | 
 26 | export const setValueAndEnterSchema = z.object({
 27 |   name: z.literal("setValueAndEnter"),
 28 |   description: z
 29 |     .literal(
 30 |       'Like "setValue", except then it presses ENTER. Use this tool can submit the form when there\'s no "submit" button.',
 31 |     )
 32 |     .optional(),
 33 |   args: z.object({
 34 |     uid: z.string(),
 35 |     value: z.string(),
 36 |   }),
 37 | });
 38 | 
 39 | export const navigateSchema = z.object({
 40 |   name: z.literal("navigate"),
 41 |   description: z
 42 |     .literal(
 43 |       "Navigate to a new page. The value should be a URL. Use this tool only when the current task requires navigating to a new page.",
 44 |     )
 45 |     .optional(),
 46 |   args: z.object({
 47 |     url: z.string(),
 48 |   }),
 49 | });
 50 | 
 51 | export const scrollSchema = z.object({
 52 |   name: z.literal("scroll"),
 53 |   description: z
 54 |     .literal(
 55 |       'Scroll the page to see the other parts. Use "up" or "down" to scroll 2/3 of height of the window. Use "top" or "bottom" to quickly scroll to the top or bottom of the page.',
 56 |     )
 57 |     .optional(),
 58 |   args: z.object({
 59 |     value: z.string(),
 60 |   }),
 61 | });
 62 | 
 63 | export const waitSchema = z.object({
 64 |   name: z.literal("wait"),
 65 |   description: z
 66 |     .literal(
 67 |       "Wait for 3 seconds before the next action. Useful when the page is loading.",
 68 |     )
 69 |     .optional(),
 70 |   args: z.object({}).optional(),
 71 | });
 72 | 
 73 | export const finishSchema = z.object({
 74 |   name: z.literal("finish"),
 75 |   description: z.literal("Indicate the task is finished").optional(),
 76 |   args: z.object({}).optional(),
 77 | });
 78 | 
 79 | export const failSchema = z.object({
 80 |   name: z.literal("fail"),
 81 |   description: z
 82 |     .literal("Indicate that you are unable to complete the task")
 83 |     .optional(),
 84 |   args: z.object({}).optional(),
 85 | });
 86 | 
 87 | export const toolSchemaUnion = z.discriminatedUnion("name", [
 88 |   clickSchema,
 89 |   setValueSchema,
 90 |   setValueAndEnterSchema,
 91 |   navigateSchema,
 92 |   scrollSchema,
 93 |   waitSchema,
 94 |   finishSchema,
 95 |   failSchema,
 96 | ]);
 97 | const allTools = toolSchemaUnion.options;
 98 | type ToolSchema = (typeof allTools)[number];
 99 | 
100 | export type ToolOperation = z.infer<typeof toolSchemaUnion>;
101 | 
/**
 * Renders a tool schema as plain text: its name, its description and its
 * arguments (if any), one per line.
 *
 * @param schema - One of the tool schemas from `toolSchemaUnion`.
 * @returns The description text, terminated by a newline.
 */
export function schemaToDescription(schema: ToolSchema): string {
  const { name, description, args } = schema.shape;
  const lines = [
    `Name: ${name._def.value}`,
    // `description` is an optional literal; unwrap it to reach the text.
    `Description: ${description.unwrap()._def.value}`,
  ];

  // If the tool has arguments, list them. If entire args is ZodOptional, there are no arguments.
  const hasArguments =
    args instanceof z.ZodObject && Object.keys(args.shape).length > 0;
  if (hasArguments) {
    lines.push("Arguments:");
    for (const [key, value] of Object.entries(args.shape)) {
      const argType = value instanceof z.ZodString ? "string" : "unknown";
      lines.push(`  - ${key} (${argType})`);
    }
  } else {
    lines.push("No arguments.");
  }

  return lines.join("\n") + "\n";
}
123 | 
124 | function getAllToolsDescriptions(): string {
125 |   return allTools.map(schemaToDescription).join("\n");
126 | }
127 | export const allToolsDescriptions = getAllToolsDescriptions();
128 | 


--------------------------------------------------------------------------------
/src/helpers/voiceControl.ts:
--------------------------------------------------------------------------------
  1 | import { useAppState } from "../state/store";
  2 | import OpenAI from "openai";
  3 | 
  4 | type SetTranscriptionFunction = (transcript: string, isFinal: boolean) => void;
  5 | 
  6 | class VoiceControlManager {
  7 |   private recognition: SpeechRecognition | null;
  8 |   private cumulativeTranscript = "";
  9 |   private setTranscription: SetTranscriptionFunction | null = null;
 10 | 
 11 |   constructor() {
 12 |     const SpeechRecognition =
 13 |       window.SpeechRecognition || window.webkitSpeechRecognition;
 14 |     if (SpeechRecognition) {
 15 |       this.recognition = new SpeechRecognition();
 16 |       this.recognition.continuous = true;
 17 |       this.recognition.interimResults = true;
 18 |       this.recognition.lang = "en-US";
 19 | 
 20 |       this.recognition.onresult = (event) => {
 21 |         let interimTranscript = "";
 22 |         for (let i = event.resultIndex; i < event.results.length; ++i) {
 23 |           if (event.results[i].isFinal) {
 24 |             const transcript = event.results[i][0].transcript;
 25 |             this.cumulativeTranscript += transcript.trim() + " ";
 26 |           } else {
 27 |             interimTranscript += event.results[i][0].transcript;
 28 |           }
 29 |         }
 30 |         if (this.setTranscription) {
 31 |           this.setTranscription(
 32 |             this.cumulativeTranscript + interimTranscript,
 33 |             false,
 34 |           );
 35 |         }
 36 |       };
 37 | 
 38 |       this.recognition.onerror = (event) => {
 39 |         console.error("Speech recognition error:", event.error);
 40 |       };
 41 |     } else {
 42 |       console.error("Browser does not support Speech Recognition.");
 43 |       this.recognition = null;
 44 |     }
 45 |   }
 46 | 
 47 |   public startListening = async (): Promise<void> => {
 48 |     if (!this.recognition) {
 49 |       console.error("Speech Recognition is not initialized.");
 50 |       return;
 51 |     }
 52 | 
 53 |     this.cumulativeTranscript = "";
 54 |     this.setTranscription = useAppState.getState().ui.actions.setInstructions;
 55 |     this.recognition.start();
 56 |   };
 57 | 
 58 |   public stopListening = (): void => {
 59 |     if (this.recognition) {
 60 |       this.recognition.stop();
 61 |     }
 62 |     if (this.setTranscription && this.cumulativeTranscript !== "") {
 63 |       this.setTranscription(this.cumulativeTranscript, true);
 64 |     }
 65 |     this.setTranscription = null;
 66 |   };
 67 | 
 68 |   public basicSpeak = (text: string): void => {
 69 |     const utterance = new SpeechSynthesisUtterance(text);
 70 |     utterance.rate = 2;
 71 |     speechSynthesis.speak(utterance);
 72 |   };
 73 | 
 74 |   public speak = async (text: string, onError: (error: string) => void) => {
 75 |     const key = useAppState.getState().settings.openAIKey ?? undefined;
 76 |     const openai = new OpenAI({
 77 |       apiKey: key,
 78 |       dangerouslyAllowBrowser: true,
 79 |     });
 80 | 
 81 |     try {
 82 |       const mp3Response = await openai.audio.speech.create({
 83 |         model: "tts-1",
 84 |         voice: "nova",
 85 |         input: text,
 86 |         speed: 1,
 87 |       });
 88 |       const arrayBuffer = await mp3Response.arrayBuffer();
 89 |       const blob = new Blob([arrayBuffer], { type: "audio/mp3" });
 90 |       const audioUrl = URL.createObjectURL(blob);
 91 |       const audio = new Audio(audioUrl);
 92 |       audio.play();
 93 |       // eslint-disable-next-line @typescript-eslint/no-explicit-any
 94 |     } catch (error: any) {
 95 |       console.error("Error generating or playing speech:", error);
 96 |       onError(error.message);
 97 |     }
 98 |   };
 99 | }
100 | 
101 | export const voiceControl = new VoiceControlManager();
102 | 


--------------------------------------------------------------------------------
/src/pages/background/index.ts:
--------------------------------------------------------------------------------
 1 | import reloadOnUpdate from "virtual:reload-on-update-in-background-script";
 2 | import "webextension-polyfill";
 3 | 
 4 | reloadOnUpdate("pages/background");
 5 | 
 6 | /**
 7 |  * Extension reloading is necessary because the browser automatically caches the css.
 8 |  * If you do not use the css of the content script, please delete it.
 9 |  */
10 | reloadOnUpdate("pages/content/style.scss");
11 | 
12 | console.log("background loaded");
13 | 
14 | // Allows users to open the side panel by clicking on the action toolbar icon
15 | chrome.sidePanel
16 |   .setPanelBehavior({ openPanelOnActionClick: true })
17 |   .catch((error) => console.error(error));
18 | 
// Handles "injectFunctions" requests by injecting the main-world script
// into the tab named by `message.tabId`.
chrome.runtime.onMessage.addListener((message) => {
  if (message?.action === "injectFunctions") {
    if (message.tabId == null) {
      console.log("no active tab found");
    } else {
      chrome.scripting
        .executeScript({
          target: { tabId: message.tabId },
          files: ["assets/js/mainWorld.js"],
          world: "MAIN",
        })
        // Log injection failures instead of leaving the rejection unhandled.
        .catch((error) => console.error(error));
    }
    return true;
  }
});
33 | 


--------------------------------------------------------------------------------
/src/pages/content/attachFile.ts:
--------------------------------------------------------------------------------
 1 | function base64ToBlob(base64: string, mimeType = "") {
 2 |   const byteCharacters = atob(base64);
 3 |   const byteNumbers = Array.from(byteCharacters, (char) => char.charCodeAt(0));
 4 |   const byteArray = new Uint8Array(byteNumbers);
 5 |   return new Blob([byteArray], { type: mimeType });
 6 | }
 7 | 
 8 | export default function attachFile(data: string, selector: string) {
 9 |   const screenshotBlob = base64ToBlob(data, "image/png");
10 |   // Create a virtual input element
11 |   const input = document.createElement("input");
12 |   input.type = "file";
13 |   input.style.display = "none";
14 | 
15 |   // Append to the document
16 |   document.body.appendChild(input);
17 | 
18 |   // Simulate file input for the screenshot blob
19 |   const dataTransfer = new DataTransfer();
20 |   dataTransfer.items.add(new File([screenshotBlob], "screenshot.png"));
21 |   input.files = dataTransfer.files;
22 | 
23 |   // Find the actual file input on the page and set its files property
24 |   const actualFileInput = document.querySelector(selector) as HTMLInputElement;
25 |   console.log(actualFileInput, selector);
26 |   if (!actualFileInput) {
27 |     console.log("could not find file input");
28 |     return;
29 |   }
30 |   actualFileInput.files = input.files;
31 |   console.log(actualFileInput.files);
32 | 
33 |   actualFileInput.dispatchEvent(
34 |     new Event("input", { bubbles: true, composed: true }),
35 |   );
36 |   actualFileInput.dispatchEvent(new Event("change", { bubbles: true }));
37 | 
38 |   // Clean up
39 |   document.body.removeChild(input);
40 | }
41 | 


--------------------------------------------------------------------------------
/src/pages/content/copyToClipboard.ts:
--------------------------------------------------------------------------------
1 | // copy provided text to clipboard
2 | export async function copyToClipboard(text: string) {
3 |   await navigator.clipboard.writeText(text);
4 | }
5 | 


--------------------------------------------------------------------------------
/src/pages/content/domOperations.ts:
--------------------------------------------------------------------------------
 1 | // The content script runs inside each page this extension is enabled on
 2 | // Do NOT import from here from outside of content script (other than types).
 3 | 
 4 | import getAnnotatedDOM, { getUniqueElementSelectorId } from "./getAnnotatedDOM";
 5 | import { copyToClipboard } from "./copyToClipboard";
 6 | import attachFile from "./attachFile";
 7 | import { drawLabels, removeLabels } from "./drawLabels";
 8 | import ripple from "./ripple";
 9 | import { getDataFromRenderedMarkdown } from "./reverseMarkdown";
10 | import getViewportPercentage from "./getViewportPercentage";
11 | import { injectMicrophonePermissionIframe } from "./permission";
12 | 
/**
 * Clicks the first element matching `selector`, showing a ripple at the
 * element's center first. Logs a warning and does nothing when no element
 * matches.
 *
 * @param selector - CSS selector of the element to click.
 */
function clickWithSelector(selector: string) {
  const element = document.querySelector<HTMLElement>(selector);
  // Check before touching the element: querySelector returns null when
  // nothing matches.
  if (!element) {
    console.warn("clickWithSelector: no element matches", selector);
    return;
  }
  // get center coordinates of the element
  const { x, y } = element.getBoundingClientRect();
  const centerX = x + element.offsetWidth / 2;
  const centerY = y + element.offsetHeight / 2;
  ripple(centerX, centerY);
  element.click();
}
24 | 
25 | export const rpcMethods = {
26 |   clickWithSelector,
27 |   getAnnotatedDOM,
28 |   getUniqueElementSelectorId,
29 |   ripple,
30 |   copyToClipboard,
31 |   attachFile,
32 |   drawLabels,
33 |   removeLabels,
34 |   getDataFromRenderedMarkdown,
35 |   getViewportPercentage,
36 |   injectMicrophonePermissionIframe,
37 | } as const;
38 | 
39 | export type RPCMethods = typeof rpcMethods;
40 | type MethodName = keyof RPCMethods;
41 | 
42 | export type RPCMessage = {
43 |   [K in MethodName]: {
44 |     method: K;
45 |     payload: Parameters<RPCMethods[K]>;
46 |   };
47 | }[MethodName];
48 | 
/**
 * Registers the message listener that dispatches incoming RPC messages to
 * the functions in `rpcMethods` and sends their result back to the caller.
 *
 * This function should run in the content script.
 */
export const initializeRPC = () => {
  chrome.runtime.onMessage.addListener(
    (message: RPCMessage, sender, sendResponse): true | undefined => {
      const { method, payload } = message;
      console.log("RPC listener", method);
      // Only dispatch to the object's own keys; `in` would also accept
      // inherited names such as "toString".
      if (!Object.prototype.hasOwnProperty.call(rpcMethods, method)) {
        return undefined;
      }
      // @ts-expect-error - we know this is valid (see pageRPC)
      const resp = rpcMethods[method as keyof RPCMethods](...payload);
      if (resp instanceof Promise) {
        resp.then(
          (resolvedResp) => {
            sendResponse(resolvedResp);
          },
          (error) => {
            // Log the failure and still answer, so the caller is not left
            // waiting on a response that never arrives.
            console.error("RPC method failed:", method, error);
            sendResponse(undefined);
          },
        );
      } else {
        sendResponse(resp);
      }
      // Returning true keeps the channel open for the asynchronous response.
      return true;
    },
  );
};
70 | 


--------------------------------------------------------------------------------
/src/pages/content/getAnnotatedDOM.ts:
--------------------------------------------------------------------------------
 1 | import { TAXY_ELEMENT_SELECTOR } from "../../constants";
 2 | 
 3 | function isInteractive(
 4 |   element: HTMLElement,
 5 |   style: CSSStyleDeclaration,
 6 | ): boolean {
 7 |   return (
 8 |     element.tagName === "A" ||
 9 |     element.tagName === "INPUT" ||
10 |     element.tagName === "BUTTON" ||
11 |     element.tagName === "SELECT" ||
12 |     element.tagName === "TEXTAREA" ||
13 |     element.hasAttribute("onclick") ||
14 |     element.hasAttribute("onmousedown") ||
15 |     element.hasAttribute("onmouseup") ||
16 |     element.hasAttribute("onkeydown") ||
17 |     element.hasAttribute("onkeyup") ||
18 |     style.cursor === "pointer"
19 |   );
20 | }
21 | 
/**
 * Heuristically decides whether an element is visible, based on its
 * opacity, display and visibility styles and its `aria-hidden` attribute.
 *
 * @param element - The element to inspect.
 * @param style - The style declaration to read from.
 */
function isVisible(element: HTMLElement, style: CSSStyleDeclaration): boolean {
  // An empty opacity string is treated as not visible, as is full
  // transparency.
  if (style.opacity === "" || style.opacity === "0") {
    return false;
  }
  if (style.display === "none" || style.visibility === "hidden") {
    return false;
  }
  return element.getAttribute("aria-hidden") !== "true";
}
31 | 
32 | let currentElements: HTMLElement[] = [];
33 | 
/**
 * Recursively clones `node` and its descendants. Every element encountered
 * is appended to `pageElements`, and its clone is tagged with:
 *  - `data-id`: the element's index in `pageElements`
 *  - `data-interactive`: result of `isInteractive`
 *  - `data-visible`: result of `isVisible`
 *
 * @param node - Root of the subtree to clone.
 * @param pageElements - Accumulator for the original elements (mutated).
 * @returns The accumulator and the annotated clone of `node`.
 */
function traverseDOM(node: Node, pageElements: HTMLElement[]) {
  // Shallow clone; children are cloned and appended one by one below.
  const clonedNode = node.cloneNode(false) as Node;

  if (node.nodeType === Node.ELEMENT_NODE) {
    const element = node as HTMLElement;
    const annotated = clonedNode as HTMLElement;
    const style = window.getComputedStyle(element);

    const index = pageElements.push(element) - 1;
    annotated.setAttribute("data-id", index.toString());
    annotated.setAttribute(
      "data-interactive",
      isInteractive(element, style).toString(),
    );
    annotated.setAttribute("data-visible", isVisible(element, style).toString());
  }

  for (const child of Array.from(node.childNodes)) {
    const { clonedDOM } = traverseDOM(child, pageElements);
    clonedNode.appendChild(clonedDOM);
  }

  return {
    pageElements,
    clonedDOM: clonedNode,
  };
}
65 | 
/**
 * Snapshots the current document as an HTML string.
 *
 * The page is cloned via `traverseDOM`, which tags every element of the copy
 * with `data-id`, `data-interactive` and `data-visible` attributes. The
 * original elements are stored in the module-level `currentElements` array,
 * replacing the elements recorded by any previous call.
 *
 * @returns The `outerHTML` of the annotated clone of the document element.
 */
export default function getAnnotatedDOM() {
  currentElements = [];
  const { clonedDOM } = traverseDOM(document.documentElement, currentElements);
  const annotatedRoot = clonedDOM as HTMLElement;
  return annotatedRoot.outerHTML;
}
75 | 
/**
 * Returns a unique id for the element recorded at index `id` by the most
 * recent `getAnnotatedDOM` call, stored on the element under the
 * `TAXY_ELEMENT_SELECTOR` attribute.
 *
 * Idempotent: an element that already carries the attribute keeps its id.
 *
 * @param id - Index of the element in the recorded element list.
 * @returns The element's unique id.
 * @throws Error when no element is recorded at `id`.
 */
export function getUniqueElementSelectorId(id: number): string {
  const element = currentElements[id];
  if (!element) {
    // The id is out of range for the elements currently recorded.
    throw new Error(`No annotated element found for id ${id}`);
  }
  // element may already have a unique id
  let uniqueId = element.getAttribute(TAXY_ELEMENT_SELECTOR);
  if (uniqueId) return uniqueId;
  uniqueId = Math.random().toString(36).substring(2, 10);
  element.setAttribute(TAXY_ELEMENT_SELECTOR, uniqueId);
  return uniqueId;
}
86 | 


--------------------------------------------------------------------------------
/src/pages/content/getViewportPercentage.ts:
--------------------------------------------------------------------------------
 1 | export default function getViewportPercentage(): number {
 2 |   // Total height of the document
 3 |   const documentHeight: number = Math.max(
 4 |     document.body.scrollHeight,
 5 |     document.body.offsetHeight,
 6 |     document.documentElement.clientHeight,
 7 |     document.documentElement.scrollHeight,
 8 |     document.documentElement.offsetHeight,
 9 |   );
10 | 
11 |   // Viewport height
12 |   const viewportHeight: number = window.innerHeight;
13 |   // How much has been scrolled
14 |   const scrollY: number = window.scrollY;
15 | 
16 |   // Calculate the end of the current viewport position as a percentage of the total document height
17 |   const percentage: number =
18 |     ((scrollY + viewportHeight) / documentHeight) * 100;
19 | 
20 |   return percentage;
21 | }
22 | 


--------------------------------------------------------------------------------
/src/pages/content/index.ts:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * DO NOT USE import someModule from '...';
 3 |  *
 4 |  * @issue-url https://github.com/Jonghakseo/chrome-extension-boilerplate-react-vite/issues/160
 5 |  *
 6 |  * Chrome extensions don't support modules in content scripts.
 7 |  * If you want to use other modules in content scripts, you need to import them via these files.
 8 |  *
 9 |  */
10 | import("@pages/content/injected");
11 | 


--------------------------------------------------------------------------------
/src/pages/content/injected.ts:
--------------------------------------------------------------------------------
1 | // The content script runs inside each page this extension is enabled on
2 | 
3 | import { initializeRPC } from "./domOperations";
4 | 
5 | initializeRPC();
6 | 


--------------------------------------------------------------------------------
/src/pages/content/mainWorld/index.ts:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * DO NOT USE import someModule from '...';
 3 |  *
 4 |  * @issue-url https://github.com/Jonghakseo/chrome-extension-boilerplate-react-vite/issues/160
 5 |  *
 6 |  * Chrome extensions don't support modules in content scripts.
 7 |  * If you want to use other modules in content scripts, you need to import them via these files.
 8 |  *
 9 |  */
10 | import("@pages/content/mainWorld/mainWorld");
11 | 


--------------------------------------------------------------------------------
/src/pages/content/mainWorld/mainWorld.ts:
--------------------------------------------------------------------------------
 1 | // This file will be inject dynamically into the page as a content script running in the context of the page
 2 | // see Background/index.ts for how this is done
 3 | 
 4 | import { debugMode } from "@src/constants";
 5 | import { generateSimplifiedDom } from "@src/helpers/simplifyDom";
 6 | import getAnnotatedDOM from "../getAnnotatedDOM";
 7 | import { rpcMethods } from "../domOperations";
 8 | 
 9 | async function getSimplifiedDomFromPage() {
10 |   const fullDom = getAnnotatedDOM();
11 |   if (!fullDom || typeof fullDom !== "string") return null;
12 | 
13 |   const dom = new DOMParser().parseFromString(fullDom, "text/html");
14 | 
15 |   // Mount the DOM to the document in an iframe so we can use getComputedStyle
16 | 
17 |   const interactiveElements: HTMLElement[] = [];
18 | 
19 |   const simplifiedDom = generateSimplifiedDom(
20 |     dom.documentElement,
21 |     interactiveElements,
22 |   ) as HTMLElement;
23 | 
24 |   if (!simplifiedDom) {
25 |     return null;
26 |   }
27 |   return simplifiedDom.outerHTML;
28 | }
29 | 
30 | if (debugMode) {
31 |   console.log("debug mode enabled");
32 |   // @ts-expect-error - this is for debugging only
33 |   window.WW_RPC_METHODS = {
34 |     getSimplifiedDomFromPage,
35 |     ...rpcMethods,
36 |   };
37 | }
38 | 


--------------------------------------------------------------------------------
/src/pages/content/permission.ts:
--------------------------------------------------------------------------------
/**
 * Appends a hidden iframe to the page that loads the extension's permission
 * page with the "microphone" feature allowed.
 */
export const injectMicrophonePermissionIframe = () => {
  const permissionFrame = document.createElement("iframe");

  const attributes: [string, string][] = [
    ["hidden", "hidden"],
    ["id", "permissionsIFrame"],
    ["allow", "microphone"],
  ];
  for (const [name, value] of attributes) {
    permissionFrame.setAttribute(name, value);
  }

  permissionFrame.src = chrome.runtime.getURL(
    "/src/pages/permission/index.html",
  );
  document.body.appendChild(permissionFrame);
};
9 | 


--------------------------------------------------------------------------------
/src/pages/content/reverseMarkdown.ts:
--------------------------------------------------------------------------------
 1 | export function getDataFromRenderedMarkdown(selector: string) {
 2 |   const element = document.querySelector(selector);
 3 |   if (!element) {
 4 |     return null;
 5 |   }
 6 |   const text = Array.from(element.querySelectorAll("p"))
 7 |     .map((p) => p.textContent)
 8 |     .join("\n\n");
 9 |   const codeBlocks = Array.from(element.querySelectorAll("pre code")).map(
10 |     (code) => code.textContent,
11 |   );
12 | 
13 |   return { text, codeBlocks };
14 | }
15 | 


--------------------------------------------------------------------------------
/src/pages/content/ripple.ts:
--------------------------------------------------------------------------------
 1 | import { sleep } from "../../helpers/utils";
 2 | 
 3 | export default function ripple(x: number, y: number) {
 4 |   const rippleRadius = 30;
 5 |   const ripple = document.createElement("div");
 6 |   ripple.classList.add("web-agent-ripple");
 7 |   ripple.style.width = ripple.style.height = `${rippleRadius * 2}px`;
 8 |   // Take scroll position into account
 9 |   ripple.style.top = `${window.scrollY + y - rippleRadius}px`;
10 |   ripple.style.left = `${x - rippleRadius}px`;
11 | 
12 |   document.body.appendChild(ripple);
13 | 
14 |   // remove after the animation to finish
15 |   // but we don't need to `await` it
16 |   sleep(800).then(() => {
17 |     ripple.remove();
18 |   });
19 | }
20 | 


--------------------------------------------------------------------------------
/src/pages/content/style.global.scss:
--------------------------------------------------------------------------------
 1 | // IMPORTANT: this file will impact the styles on ALL PAGES
 2 | // DO NOT add style names that can easily conflict with other pages
 3 | // TODO: import this directly from fuji-web instead of copying
 4 | .web-agent-ripple {
 5 |   position: absolute;
 6 |   border-radius: 50%;
 7 |   transform: scale(0);
 8 |   animation: web-agent-ripple 0.5s ease-out;
 9 |   background-color: rgba(0, 0, 255, 0.961);
10 |   pointer-events: none;
11 |   z-index: 999999;
12 | }
13 | 
14 | @keyframes web-agent-ripple {
15 |   to {
16 |     transform: scale(3);
17 |     opacity: 0;
18 |   }
19 | }
20 | 


--------------------------------------------------------------------------------
/src/pages/content/style.scss:
--------------------------------------------------------------------------------
1 | // IMPORTANT: this file is supposed to be loaded into the shadow dom
2 | 


--------------------------------------------------------------------------------
/src/pages/devtools/index.html:
--------------------------------------------------------------------------------
 1 | <!doctype html>
 2 | <html lang="ko">
 3 |   <head>
 4 |     <meta charset="UTF-8" />
 5 |     <title>Devtools</title>
 6 |   </head>
 7 |   <body>
 8 |     <script type="module" src="./index.ts"></script>
 9 |   </body>
10 | </html>
11 | 


--------------------------------------------------------------------------------
/src/pages/devtools/index.ts:
--------------------------------------------------------------------------------
 1 | // try {
 2 | //   chrome.devtools.panels.create(
 3 | //     "Dev Tools",
 4 | //     "icon-34.png",
 5 | //     "src/pages/panel/index.html",
 6 | //   );
 7 | // } catch (e) {
 8 | //   console.error(e);
 9 | // }
10 | 


--------------------------------------------------------------------------------
/src/pages/newtab/Newtab.css:
--------------------------------------------------------------------------------
 1 | .App {
 2 |   text-align: center;
 3 | }
 4 | 
 5 | .App-logo {
 6 |   height: 40vmin;
 7 |   pointer-events: none;
 8 | }
 9 | 
10 | @media (prefers-reduced-motion: no-preference) {
11 |   .App-logo {
12 |     animation: App-logo-spin infinite 20s linear;
13 |   }
14 | }
15 | 
16 | .App-header {
17 |   min-height: 100vh;
18 |   display: flex;
19 |   flex-direction: column;
20 |   align-items: center;
21 |   justify-content: center;
22 |   font-size: calc(10px + 2vmin);
23 |   color: white;
24 | }
25 | 
26 | .App-link {
27 |   color: #61dafb;
28 | }
29 | 
30 | @keyframes App-logo-spin {
31 |   from {
32 |     transform: rotate(0deg);
33 |   }
34 |   to {
35 |     transform: rotate(360deg);
36 |   }
37 | }
38 | 


--------------------------------------------------------------------------------
/src/pages/newtab/Newtab.scss:
--------------------------------------------------------------------------------
 1 | $myColor: red;
 2 | 
 3 | h1,
 4 | h2,
 5 | h3,
 6 | h4,
 7 | h5,
 8 | h6 {
 9 |   color: $myColor;
10 | }
11 | 


--------------------------------------------------------------------------------
/src/pages/newtab/Newtab.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import logo from "@assets/img/logo.svg";
 3 | import "@pages/newtab/Newtab.css";
 4 | import "@pages/newtab/Newtab.scss";
 5 | import useStorage from "@src/shared/hooks/useStorage";
 6 | import exampleThemeStorage from "@src/shared/storages/exampleThemeStorage";
 7 | import withSuspense from "@src/shared/hoc/withSuspense";
 8 | import withErrorBoundary from "@src/shared/hoc/withErrorBoundary";
 9 | 
/**
 * New-tab page. Reads the current theme from `exampleThemeStorage` and
 * renders the logo, a link and a button that toggles the theme.
 */
const Newtab = () => {
  const theme = useStorage(exampleThemeStorage);
  const isLight = theme === "light";

  // Inline styles derived from the active theme.
  const pageStyle = { backgroundColor: isLight ? "#ffffff" : "#000000" };
  const headerStyle = { color: isLight ? "#000" : "#fff" };
  const linkStyle = {
    color: isLight ? "#0281dc" : undefined,
    marginBottom: "10px",
  };
  const buttonStyle = {
    backgroundColor: isLight ? "#fff" : "#000",
    color: isLight ? "#000" : "#fff",
  };

  return (
    <div className="App" style={pageStyle}>
      <header className="App-header" style={headerStyle}>
        <img src={logo} className="App-logo" alt="logo" />
        <p>
          Edit <code>src/pages/newtab/Newtab.tsx</code> and save to reload.
        </p>
        <a
          className="App-link"
          href="https://reactjs.org"
          target="_blank"
          rel="noopener noreferrer"
          style={linkStyle}
        >
          Learn React!
        </a>
        <h6>The color of this paragraph is defined using SASS.</h6>
        <button style={buttonStyle} onClick={exampleThemeStorage.toggle}>
          Toggle theme
        </button>
      </header>
    </div>
  );
};

// Wrap the page so suspended storage reads show a loader and render errors
// show a fallback element.
export default withErrorBoundary(
  withSuspense(Newtab, <div> Loading ... </div>),
  <div> Error Occur </div>,
);
59 | 


--------------------------------------------------------------------------------
/src/pages/newtab/index.css:
--------------------------------------------------------------------------------
 1 | body {
 2 |   margin: 0;
 3 |   font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", "Roboto", "Oxygen",
 4 |     "Ubuntu", "Cantarell", "Fira Sans", "Droid Sans", "Helvetica Neue",
 5 |     sans-serif;
 6 |   -webkit-font-smoothing: antialiased;
 7 |   -moz-osx-font-smoothing: grayscale;
 8 | }
 9 | 
10 | code {
11 |   font-family: source-code-pro, Menlo, Monaco, Consolas, "Courier New",
12 |     monospace;
13 | }
14 | 


--------------------------------------------------------------------------------
/src/pages/newtab/index.html:
--------------------------------------------------------------------------------
 1 | <!doctype html>
 2 | <html lang="ko">
 3 |   <head>
 4 |     <meta charset="UTF-8" />
 5 |     <title>New tab</title>
 6 |   </head>
 7 | 
 8 |   <body>
 9 |     <div id="app-container"></div>
10 |     <script type="module" src="./index.tsx"></script>
11 |   </body>
12 | </html>
13 | 


--------------------------------------------------------------------------------
/src/pages/newtab/index.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import { createRoot } from "react-dom/client";
 3 | import Newtab from "@pages/newtab/Newtab";
 4 | import "@pages/newtab/index.css";
 5 | import refreshOnUpdate from "virtual:reload-on-update-in-view";
 6 | 
 7 | refreshOnUpdate("pages/newtab");
 8 | 
 9 | function init() {
10 |   const appContainer = document.querySelector("#app-container");
11 |   if (!appContainer) {
12 |     throw new Error("Can not find #app-container");
13 |   }
14 |   const root = createRoot(appContainer);
15 | 
16 |   root.render(<Newtab />);
17 | }
18 | 
19 | init();
20 | 


--------------------------------------------------------------------------------
/src/pages/options/Options.css:
--------------------------------------------------------------------------------
1 | .container {
2 |   width: 100%;
3 |   height: 50vh;
4 |   font-size: 2rem;
5 |   display: flex;
6 |   align-items: center;
7 |   justify-content: center;
8 | }
9 | 


--------------------------------------------------------------------------------
/src/pages/options/Options.tsx:
--------------------------------------------------------------------------------
1 | import React from "react";
2 | import "@pages/options/Options.css";
3 | 
/** Options page component: renders a static "Options" label. */
const Options: React.FC = () => <div className="container">Options</div>;
7 | 
8 | export default Options;
9 | 


--------------------------------------------------------------------------------
/src/pages/options/index.css:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/normal-computing/fuji-web/1aec509e4c437ca7764a5b4a56deaeba18691729/src/pages/options/index.css


--------------------------------------------------------------------------------
/src/pages/options/index.html:
--------------------------------------------------------------------------------
 1 | <!doctype html>
 2 | <html lang="ko">
 3 |   <head>
 4 |     <meta charset="UTF-8" />
 5 |     <title>Options</title>
 6 |   </head>
 7 | 
 8 |   <body>
 9 |     <div id="app-container"></div>
10 |     <script type="module" src="./index.tsx"></script>
11 |   </body>
12 | </html>
13 | 


--------------------------------------------------------------------------------
/src/pages/options/index.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import { createRoot } from "react-dom/client";
 3 | import Options from "@pages/options/Options";
 4 | import "@pages/options/index.css";
 5 | import refreshOnUpdate from "virtual:reload-on-update-in-view";
 6 | 
 7 | refreshOnUpdate("pages/options");
 8 | 
 9 | function init() {
10 |   const appContainer = document.querySelector("#app-container");
11 |   if (!appContainer) {
12 |     throw new Error("Can not find #app-container");
13 |   }
14 |   const root = createRoot(appContainer);
15 |   root.render(<Options />);
16 | }
17 | 
18 | init();
19 | 


--------------------------------------------------------------------------------
/src/pages/panel/Panel.css:
--------------------------------------------------------------------------------
1 | body {
2 |   background-color: #242424;
3 | }
4 | 
5 | .container {
6 |   color: #ffffff;
7 | }
8 | 


--------------------------------------------------------------------------------
/src/pages/panel/Panel.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import "@pages/panel/Panel.css";
 3 | 
 4 | const Panel: React.FC = () => {
 5 |   return (
 6 |     <div className="container">
 7 |       <h1 className="">Dev Tools Panel</h1>
 8 |     </div>
 9 |   );
10 | };
11 | 
12 | export default Panel;
13 | 


--------------------------------------------------------------------------------
/src/pages/panel/index.css:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/normal-computing/fuji-web/1aec509e4c437ca7764a5b4a56deaeba18691729/src/pages/panel/index.css


--------------------------------------------------------------------------------
/src/pages/panel/index.html:
--------------------------------------------------------------------------------
 1 | <!doctype html>
 2 | <html lang="ko">
 3 |   <head>
 4 |     <meta charset="UTF-8" />
 5 |     <title>Devtools Panel</title>
 6 |   </head>
 7 | 
 8 |   <body>
 9 |     <div id="app-container"></div>
10 |     <script type="module" src="./index.tsx"></script>
11 |   </body>
12 | </html>
13 | 


--------------------------------------------------------------------------------
/src/pages/panel/index.tsx:
--------------------------------------------------------------------------------
 1 | // import React from "react";
 2 | // import { createRoot } from "react-dom/client";
 3 | // import Panel from "@pages/panel/Panel";
 4 | // import "@pages/panel/index.css";
 5 | // import refreshOnUpdate from "virtual:reload-on-update-in-view";
 6 | 
 7 | // refreshOnUpdate("pages/panel");
 8 | 
 9 | // function init() {
10 | //   const appContainer = document.querySelector("#app-container");
11 | //   if (!appContainer) {
12 | //     throw new Error("Can not find #app-container");
13 | //   }
14 | //   const root = createRoot(appContainer);
15 | //   root.render(<Panel />);
16 | // }
17 | 
18 | // init();
19 | 


--------------------------------------------------------------------------------
/src/pages/permission/index.html:
--------------------------------------------------------------------------------
 1 | <!DOCTYPE html>
 2 | <html>
 3 |   <head>
 4 |     <title>Request Permissions</title>
 5 |     <script type="module" src="./requestPermission.ts"></script>
 6 |   </head>
 7 |   <body>
 8 |     <!-- Display loading or informative message here -->
 9 |   </body>
10 | </html>


--------------------------------------------------------------------------------
/src/pages/permission/requestPermission.ts:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * Requests user permission for microphone access.
 3 |  * @returns {Promise<void>} A Promise that resolves when permission is granted or rejects with an error.
 4 |  */
 5 | export async function getUserPermission(): Promise<void> {
 6 |   return new Promise((resolve, reject) => {
 7 |     // Using navigator.mediaDevices.getUserMedia to request microphone access
 8 |     navigator.mediaDevices
 9 |       .getUserMedia({ audio: true })
10 |       .then((stream) => {
11 |         // Permission granted, handle the stream if needed
12 |         console.log("Microphone access granted");
13 | 
14 |         // Stop the tracks to prevent the recording indicator from being shown
15 |         stream.getTracks().forEach(function (track) {
16 |           track.stop();
17 |         });
18 | 
19 |         resolve();
20 |       })
21 |       .catch((error) => {
22 |         console.error("Error requesting microphone permission", error);
23 | 
24 |         // Handling different error scenarios
25 |         if (error.name === "Permission denied") {
26 |           // TODO: catch this error and show a user-friendly message
27 |           reject(new Error("MICROPHONE_PERMISSION_DENIED"));
28 |         } else {
29 |           reject(error);
30 |         }
31 |       });
32 |   });
33 | }
34 | 
// Call the function to request microphone permission. getUserPermission
// already logs failures, so the handler only keeps a rejection from
// surfacing as an unhandled promise rejection.
void getUserPermission().catch(() => undefined);
37 | 


--------------------------------------------------------------------------------
/src/pages/popup/Popup.css:
--------------------------------------------------------------------------------
 1 | .App {
 2 |   position: absolute;
 3 |   top: 0;
 4 |   bottom: 0;
 5 |   left: 0;
 6 |   right: 0;
 7 |   text-align: center;
 8 |   height: 100%;
 9 |   padding: 10px;
10 |   background-color: #282c34;
11 | }
12 | 
13 | .App-logo {
14 |   height: 30vmin;
15 |   pointer-events: none;
16 | }
17 | 
18 | @media (prefers-reduced-motion: no-preference) {
19 |   .App-logo {
20 |     animation: App-logo-spin infinite 20s linear;
21 |   }
22 | }
23 | 
24 | .App-header {
25 |   height: 100%;
26 |   display: flex;
27 |   flex-direction: column;
28 |   align-items: center;
29 |   justify-content: center;
30 |   font-size: calc(10px + 2vmin);
31 |   color: white;
32 | }
33 | 
34 | .App-link {
35 |   color: #61dafb;
36 | }
37 | 
38 | @keyframes App-logo-spin {
39 |   from {
40 |     transform: rotate(0deg);
41 |   }
42 |   to {
43 |     transform: rotate(360deg);
44 |   }
45 | }
46 | 


--------------------------------------------------------------------------------
/src/pages/popup/Popup.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import logo from "@assets/img/logo.svg";
 3 | import "@pages/popup/Popup.css";
 4 | import useStorage from "@src/shared/hooks/useStorage";
 5 | import exampleThemeStorage from "@src/shared/storages/exampleThemeStorage";
 6 | import withSuspense from "@src/shared/hoc/withSuspense";
 7 | import withErrorBoundary from "@src/shared/hoc/withErrorBoundary";
 8 | 
 9 | const Popup = () => {
10 |   const theme = useStorage(exampleThemeStorage);
11 | 
12 |   return (
13 |     <div
14 |       className="App"
15 |       style={{
16 |         backgroundColor: theme === "light" ? "#fff" : "#000",
17 |       }}
18 |     >
19 |       <header
20 |         className="App-header"
21 |         style={{ color: theme === "light" ? "#000" : "#fff" }}
22 |       >
23 |         <img src={logo} className="App-logo" alt="logo" />
24 |         <p>
25 |           Edit <code>src/pages/popup/Popup.tsx</code> and save to reload.
26 |         </p>
27 |         <a
28 |           className="App-link"
29 |           href="https://reactjs.org"
30 |           target="_blank"
31 |           rel="noopener noreferrer"
32 |           style={{
33 |             color: theme === "light" ? "#0281dc" : undefined,
34 |             marginBottom: "10px",
35 |           }}
36 |         >
37 |           Learn React!
38 |         </a>
39 |         <button
40 |           style={{
41 |             backgroundColor: theme === "light" ? "#fff" : "#000",
42 |             color: theme === "light" ? "#000" : "#fff",
43 |           }}
44 |           onClick={exampleThemeStorage.toggle}
45 |         >
46 |           Toggle theme
47 |         </button>
48 |       </header>
49 |     </div>
50 |   );
51 | };
52 | 
53 | export default withErrorBoundary(
54 |   withSuspense(Popup, <div> Loading ... </div>),
55 |   <div> Error Occur </div>,
56 | );
57 | 


--------------------------------------------------------------------------------
/src/pages/popup/index.css:
--------------------------------------------------------------------------------
 1 | body {
 2 |   width: 300px;
 3 |   height: 260px;
 4 |   margin: 0;
 5 |   font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", "Roboto", "Oxygen",
 6 |     "Ubuntu", "Cantarell", "Fira Sans", "Droid Sans", "Helvetica Neue",
 7 |     sans-serif;
 8 |   -webkit-font-smoothing: antialiased;
 9 |   -moz-osx-font-smoothing: grayscale;
10 | 
11 |   position: relative;
12 | }
13 | 
14 | code {
15 |   font-family: source-code-pro, Menlo, Monaco, Consolas, "Courier New",
16 |     monospace;
17 | }
18 | 


--------------------------------------------------------------------------------
/src/pages/popup/index.html:
--------------------------------------------------------------------------------
 1 | <!doctype html>
 2 | <html lang="ko">
 3 |   <head>
 4 |     <meta charset="UTF-8" />
 5 |     <title>Popup</title>
 6 |   </head>
 7 | 
 8 |   <body>
 9 |     <div id="app-container"></div>
10 |     <script type="module" src="./index.tsx"></script>
11 |   </body>
12 | </html>
13 | 


--------------------------------------------------------------------------------
/src/pages/popup/index.tsx:
--------------------------------------------------------------------------------
 1 | // import React from "react";
 2 | // import { createRoot } from "react-dom/client";
 3 | // import "@pages/popup/index.css";
 4 | // import Popup from "@pages/popup/Popup";
 5 | // import refreshOnUpdate from "virtual:reload-on-update-in-view";
 6 | 
 7 | // refreshOnUpdate("pages/popup");
 8 | 
 9 | // function init() {
10 | //   const appContainer = document.querySelector("#app-container");
11 | //   if (!appContainer) {
12 | //     throw new Error("Can not find #app-container");
13 | //   }
14 | //   const root = createRoot(appContainer);
15 | //   root.render(<Popup />);
16 | // }
17 | 
18 | // init();
19 | 


--------------------------------------------------------------------------------
/src/pages/sidepanel/index.css:
--------------------------------------------------------------------------------
 1 | body {
 2 |   min-height: 100dvh;
 3 |   margin: 0;
 4 |   font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", "Roboto", "Oxygen",
 5 |     "Ubuntu", "Cantarell", "Fira Sans", "Droid Sans", "Helvetica Neue",
 6 |     sans-serif;
 7 |   -webkit-font-smoothing: antialiased;
 8 |   -moz-osx-font-smoothing: grayscale;
 9 | 
10 |   position: relative;
11 |   background-color: white;
12 | }
13 | 
14 | code {
15 |   font-family: source-code-pro, Menlo, Monaco, Consolas, "Courier New",
16 |     monospace;
17 | }
18 | 


--------------------------------------------------------------------------------
/src/pages/sidepanel/index.html:
--------------------------------------------------------------------------------
 1 | <!doctype html>
 2 | <html lang="ko">
 3 |   <head>
 4 |     <meta charset="UTF-8" />
 5 |     <title>Side Panel</title>
 6 |   </head>
 7 | 
 8 |   <body>
 9 |     <div id="app-container"></div>
10 |     <script type="module" src="./index.tsx"></script>
11 |   </body>
12 | </html>
13 | 


--------------------------------------------------------------------------------
/src/pages/sidepanel/index.tsx:
--------------------------------------------------------------------------------
 1 | import { createRoot } from "react-dom/client";
 2 | 
 3 | import App from "@src/common/App";
 4 | 
 5 | import refreshOnUpdate from "virtual:reload-on-update-in-view";
 6 | 
 7 | refreshOnUpdate("pages/sidepanel");
 8 | 
 9 | function init() {
10 |   const appContainer = document.querySelector("#app-container");
11 |   if (!appContainer) {
12 |     throw new Error("Can not find #app-container");
13 |   }
14 |   const root = createRoot(appContainer);
15 |   root.render(<App />);
16 | }
17 | 
18 | init();
19 | 


--------------------------------------------------------------------------------
/src/shared/hoc/withErrorBoundary.tsx:
--------------------------------------------------------------------------------
 1 | import { Component, ComponentType, ReactElement, ErrorInfo } from "react";
 2 | 
 3 | class ErrorBoundary extends Component<
 4 |   {
 5 |     children: ReactElement;
 6 |     fallback: ReactElement;
 7 |   },
 8 |   {
 9 |     hasError: boolean;
10 |   }
11 | > {
12 |   state = { hasError: false };
13 | 
14 |   static getDerivedStateFromError() {
15 |     return { hasError: true };
16 |   }
17 | 
18 |   componentDidCatch(error: Error, errorInfo: ErrorInfo) {
19 |     console.error(error, errorInfo);
20 |   }
21 | 
22 |   render() {
23 |     if (this.state.hasError) {
24 |       return this.props.fallback;
25 |     }
26 | 
27 |     return this.props.children;
28 |   }
29 | }
30 | 
/**
 * Higher-order component that renders `Component` inside an `ErrorBoundary`.
 *
 * @param Component - component to protect
 * @param ErrorComponent - element shown after `Component` (or a descendant) throws
 * @returns a component accepting the same props as `Component`
 */
export default function withErrorBoundary<T extends Record<string, unknown>>(
  Component: ComponentType<T>,
  ErrorComponent: ReactElement,
) {
  const WithErrorBoundary = (props: T) => (
    <ErrorBoundary fallback={ErrorComponent}>
      <Component {...props} />
    </ErrorBoundary>
  );

  return WithErrorBoundary;
}
43 | 


--------------------------------------------------------------------------------
/src/shared/hoc/withSuspense.tsx:
--------------------------------------------------------------------------------
 1 | import { ComponentType, ReactElement, Suspense } from "react";
 2 | 
 3 | export default function withSuspense<T extends Record<string, unknown>>(
 4 |   Component: ComponentType<T>,
 5 |   SuspenseComponent: ReactElement,
 6 | ) {
 7 |   return function WithSuspense(props: T) {
 8 |     return (
 9 |       <Suspense fallback={SuspenseComponent}>
10 |         <Component {...props} />
11 |       </Suspense>
12 |     );
13 |   };
14 | }
15 | 


--------------------------------------------------------------------------------
/src/shared/hooks/useStorage.tsx:
--------------------------------------------------------------------------------
 1 | import { useSyncExternalStore } from "react";
 2 | import { BaseStorage } from "@src/shared/storages/base";
 3 | 
 4 | type WrappedPromise = ReturnType<typeof wrapPromise>;
 5 | const storageMap: Map<BaseStorage<unknown>, WrappedPromise> = new Map();
 6 | 
 7 | export default function useStorage<
 8 |   Storage extends BaseStorage<Data>,
 9 |   Data = Storage extends BaseStorage<infer Data> ? Data : unknown,
10 | >(storage: Storage) {
11 |   const map = storageMap as Map<Storage, WrappedPromise>;
12 |   const _data = useSyncExternalStore<Data | null>(
13 |     storage.subscribe,
14 |     storage.getSnapshot,
15 |   );
16 | 
17 |   if (!map.has(storage)) {
18 |     map.set(storage, wrapPromise(storage.get()));
19 |   }
20 |   if (_data !== null) {
21 |     map.set(storage, { read: () => _data });
22 |   }
23 | 
24 |   return _data ?? (map.get(storage)!.read() as Data);
25 | }
26 | 
/**
 * Wraps a promise in a reader object.
 *
 * `read()` throws the tracking promise while the original is pending, throws
 * the rejection reason once it has rejected, and returns the value once it
 * has resolved.
 *
 * @param promise - promise to track
 * @returns an object exposing `read()`
 */
function wrapPromise<R>(promise: Promise<R>) {
  type Outcome =
    | { status: "pending" }
    | { status: "success"; value: R }
    | { status: "error"; reason: unknown };

  let outcome: Outcome = { status: "pending" };

  // Settles with `undefined` in both cases; it exists only to be thrown.
  const suspender = promise.then(
    (value) => {
      outcome = { status: "success", value };
    },
    (reason) => {
      outcome = { status: "error", reason };
    },
  );

  return {
    read(): R | undefined {
      switch (outcome.status) {
        case "pending":
          throw suspender;
        case "error":
          throw outcome.reason;
        case "success":
          return outcome.value;
      }
    },
  };
}
53 | 


--------------------------------------------------------------------------------
/src/shared/images/mergeScreenshots.ts:
--------------------------------------------------------------------------------
  1 | // TODO: make it configurable?
  2 | const DEFAULT_FONT_SIZE = 40;
  3 | const DEFAULT_FONT_STYLE = `${DEFAULT_FONT_SIZE}px serif`;
  4 | 
  5 | export type ImageSourceAttrs = {
  6 |   src: string;
  7 |   caption?: string;
  8 |   opacity?: number | undefined;
  9 | };
 10 | 
 11 | type ExtendedImageData = ImageSourceAttrs & {
 12 |   img: HTMLImageElement;
 13 | };
 14 | 
 15 | export type MergeImageOptionsInput = {
 16 |   format?: string;
 17 |   quality?: number;
 18 |   maxFileSizeMB?: number;
 19 |   padding?: number;
 20 | };
 21 | 
 22 | type MergeImageOptions = MergeImageOptionsInput & {
 23 |   format: string;
 24 |   padding: number;
 25 | };
 26 | 
 27 | export type GetCanvasSize = (
 28 |   images: ExtendedImageData[],
 29 |   options: MergeImageOptions,
 30 | ) => {
 31 |   width: number;
 32 |   height: number;
 33 | };
 34 | 
 35 | const getHorizontalLayoutCanvasSize: GetCanvasSize = (images, options) => {
 36 |   let width = 0;
 37 |   let height = 0;
 38 |   images.forEach((image) => {
 39 |     const padding = options.padding;
 40 |     width += image.img.width + padding * 2;
 41 |     height = Math.max(height, image.img.height + padding * 2);
 42 |   });
 43 |   return {
 44 |     width,
 45 |     height: height + DEFAULT_FONT_SIZE,
 46 |   };
 47 | };
 48 | 
 49 | // Function to get WebP data URL and ensure it's less than 5 MB
 50 | function getWebPDataURL(
 51 |   canvas: HTMLCanvasElement,
 52 |   maxFileSizeMB: number = 5,
 53 |   maxQuality = 1,
 54 |   qualityStep = 0.05,
 55 | ) {
 56 |   const maxFileSizeBytes = maxFileSizeMB * 1024 * 1024;
 57 |   let quality = maxQuality;
 58 |   let dataURL = canvas.toDataURL("image/webp", quality);
 59 | 
 60 |   // Check the size of the data URL
 61 |   while (dataURL.length * 0.75 > maxFileSizeBytes && quality > 0) {
 62 |     quality -= qualityStep; // Decrease quality
 63 |     dataURL = canvas.toDataURL("image/webp", quality);
 64 |   }
 65 | 
 66 |   return dataURL;
 67 | }
 68 | 
 69 | // Defaults
 70 | const defaultOptions: MergeImageOptions = {
 71 |   format: "image/webp",
 72 |   quality: 1,
 73 |   maxFileSizeMB: 5,
 74 |   padding: 40,
 75 | };
 76 | 
 77 | const mergeImages = async (
 78 |   sources: ImageSourceAttrs[] = [],
 79 |   optionsInput: MergeImageOptionsInput = {},
 80 | ) => {
 81 |   const options: MergeImageOptions = {
 82 |     ...defaultOptions,
 83 |     ...optionsInput,
 84 |   };
 85 | 
 86 |   // Setup browser/Node.js specific variables
 87 |   const canvas = window.document.createElement("canvas");
 88 | 
 89 |   // Load sources
 90 |   const images: Promise<ExtendedImageData>[] = sources.map(
 91 |     (source) =>
 92 |       new Promise((resolve, reject) => {
 93 |         // Resolve source and img when loaded
 94 |         const img = new Image();
 95 |         img.onerror = () => reject(new Error("Couldn't load image"));
 96 |         const data = {
 97 |           ...source,
 98 |           img,
 99 |         };
100 |         img.onload = () => resolve(data);
101 |         img.src = source.src;
102 |       }),
103 |   );
104 | 
105 |   // Get canvas context
106 |   const ctx = canvas.getContext("2d");
107 |   if (!ctx) {
108 |     throw new Error("Could not get canvas context");
109 |   }
110 | 
111 |   // When sources have loaded
112 |   return await Promise.all(images).then((images) => {
113 |     // Set canvas dimensions
114 |     const canvasSize = getHorizontalLayoutCanvasSize(images, options);
115 |     canvas.width = canvasSize.width;
116 |     canvas.height = canvasSize.height;
117 |     // fill canvas with gray background
118 |     ctx.fillStyle = "#f0f0f0";
119 |     ctx.fillRect(0, 0, canvas.width, canvas.height);
120 | 
121 |     // Draw images and captions to canvas (horizontally)
122 |     let x = options.padding;
123 |     const y = options.padding;
124 |     ctx.textAlign = "center";
125 |     ctx.font = DEFAULT_FONT_STYLE;
126 |     ctx.fillStyle = "black";
127 |     ctx.strokeStyle = "black";
128 |     images.forEach((image) => {
129 |       ctx.globalAlpha = image.opacity ?? 1;
130 |       ctx.drawImage(image.img, x, y);
131 |       // border around image
132 |       ctx.strokeRect(x, y, image.img.width, image.img.height);
133 |       if (image.caption != null) {
134 |         ctx.fillText(
135 |           image.caption,
136 |           x + image.img.width / 2,
137 |           y + image.img.height + DEFAULT_FONT_SIZE,
138 |         );
139 |       }
140 |       // Increment x to where the next image should be drawn
141 |       x += image.img.width + options.padding;
142 |     });
143 | 
144 |     if (options.format === "image/webp") {
145 |       return getWebPDataURL(canvas, options.maxFileSizeMB, options.quality);
146 |     }
147 | 
148 |     return canvas.toDataURL(options.format, options.quality);
149 |   });
150 | };
151 | 
152 | export default mergeImages;
153 | 


--------------------------------------------------------------------------------
/src/shared/storages/base.ts:
--------------------------------------------------------------------------------
 1 | export enum StorageType {
 2 |   Local = "local",
 3 |   Sync = "sync",
 4 |   Managed = "managed",
 5 |   Session = "session",
 6 | }
 7 | 
 8 | type ValueOrUpdate<D> = D | ((prev: D) => Promise<D> | D);
 9 | 
10 | export type BaseStorage<D> = {
11 |   get: () => Promise<D>;
12 |   set: (value: ValueOrUpdate<D>) => Promise<void>;
13 |   getSnapshot: () => D | null;
14 |   subscribe: (listener: () => void) => () => void;
15 | };
16 | 
17 | export function createStorage<D>(
18 |   key: string,
19 |   fallback: D,
20 |   config?: { storageType?: StorageType },
21 | ): BaseStorage<D> {
22 |   let cache: D | null = null;
23 |   let listeners: Array<() => void> = [];
24 |   const storageType = config?.storageType ?? StorageType.Local;
25 | 
26 |   const _getDataFromStorage = async (): Promise<D> => {
27 |     if (chrome.storage[storageType] === undefined) {
28 |       throw new Error(
29 |         `Check your storage permission into manifest.json: ${storageType} is not defined`,
30 |       );
31 |     }
32 |     const value = await chrome.storage[storageType].get([key]);
33 |     return value[key] ?? fallback;
34 |   };
35 | 
36 |   const _emitChange = () => {
37 |     listeners.forEach((listener) => listener());
38 |   };
39 | 
40 |   const set = async (valueOrUpdate: ValueOrUpdate<D>) => {
41 |     if (typeof valueOrUpdate === "function") {
42 |       // eslint-disable-next-line no-prototype-builtins
43 |       if (valueOrUpdate.hasOwnProperty("then")) {
44 |         // eslint-disable-next-line @typescript-eslint/ban-ts-comment
45 |         // @ts-ignore
46 |         cache = await valueOrUpdate(cache);
47 |       } else {
48 |         // eslint-disable-next-line @typescript-eslint/ban-ts-comment
49 |         // @ts-ignore
50 |         cache = valueOrUpdate(cache);
51 |       }
52 |     } else {
53 |       cache = valueOrUpdate;
54 |     }
55 |     await chrome.storage[storageType].set({ [key]: cache });
56 |     _emitChange();
57 |   };
58 | 
59 |   const subscribe = (listener: () => void) => {
60 |     listeners = [...listeners, listener];
61 |     return () => {
62 |       listeners = listeners.filter((l) => l !== listener);
63 |     };
64 |   };
65 | 
66 |   const getSnapshot = () => {
67 |     return cache;
68 |   };
69 | 
70 |   _getDataFromStorage().then((data) => {
71 |     cache = data;
72 |     _emitChange();
73 |   });
74 | 
75 |   return {
76 |     get: _getDataFromStorage,
77 |     set,
78 |     getSnapshot,
79 |     subscribe,
80 |   };
81 | }
82 | 


--------------------------------------------------------------------------------
/src/shared/storages/exampleThemeStorage.ts:
--------------------------------------------------------------------------------
 1 | import {
 2 |   BaseStorage,
 3 |   createStorage,
 4 |   StorageType,
 5 | } from "@src/shared/storages/base";
 6 | 
 7 | type Theme = "light" | "dark";
 8 | 
 9 | type ThemeStorage = BaseStorage<Theme> & {
10 |   toggle: () => void;
11 | };
12 | 
13 | const storage = createStorage<Theme>("theme-storage-key", "light", {
14 |   storageType: StorageType.Local,
15 | });
16 | 
/** Theme storage extended with a `toggle` helper that flips light/dark. */
const exampleThemeStorage: ThemeStorage = {
  ...storage,
  // TODO: extends your own methods
  toggle() {
    // Anything other than "light" switches back to "light".
    void storage.set((currentTheme) =>
      currentTheme === "light" ? "dark" : "light",
    );
  },
};
26 | 
27 | export default exampleThemeStorage;
28 | 


--------------------------------------------------------------------------------
/src/state/settings.ts:
--------------------------------------------------------------------------------
 1 | import { type Data } from "../helpers/knowledge/index";
 2 | import { MyStateCreator } from "./store";
 3 | import {
 4 |   SupportedModels,
 5 |   findBestMatchingModel,
 6 |   AgentMode,
 7 | } from "../helpers/aiSdkUtils";
 8 | 
 9 | export type SettingsSlice = {
10 |   openAIKey: string | undefined;
11 |   anthropicKey: string | undefined;
12 |   openAIBaseUrl: string | undefined;
13 |   anthropicBaseUrl: string | undefined;
14 |   geminiKey: string | undefined;
15 |   selectedModel: SupportedModels;
16 |   agentMode: AgentMode;
17 |   voiceMode: boolean;
18 |   customKnowledgeBase: Data;
19 |   actions: {
20 |     update: (values: Partial<SettingsSlice>) => void;
21 |   };
22 | };
/**
 * Creates the settings slice: API keys and base URLs, the selected model,
 * agent mode, voice mode, the custom knowledge base, and an `update` action.
 */
export const createSettingsSlice: MyStateCreator<SettingsSlice> = (set) => {
  /**
   * Merges `values` into the settings, then re-resolves the selected model
   * with `findBestMatchingModel` and switches voice mode off when no OpenAI
   * key is set.
   */
  const update = (values: Partial<SettingsSlice>) => {
    set((state) => {
      const merged: SettingsSlice = { ...state.settings, ...values };
      const { selectedModel, agentMode, openAIKey, anthropicKey, geminiKey } =
        merged;

      merged.selectedModel = findBestMatchingModel(
        selectedModel,
        agentMode,
        openAIKey,
        anthropicKey,
        geminiKey,
      );
      // voice model current relies on OpenAI API key
      if (!openAIKey) {
        merged.voiceMode = false;
      }
      state.settings = merged;
    });
  };

  return {
    openAIKey: undefined,
    anthropicKey: undefined,
    openAIBaseUrl: undefined,
    anthropicBaseUrl: undefined,
    geminiKey: undefined,
    agentMode: AgentMode.VisionEnhanced,
    selectedModel: SupportedModels.Gpt4Turbo,
    voiceMode: false,
    customKnowledgeBase: {},
    actions: { update },
  };
};
53 | 


--------------------------------------------------------------------------------
/src/state/store.ts:
--------------------------------------------------------------------------------
 1 | import { merge } from "lodash";
 2 | import { create, StateCreator } from "zustand";
 3 | import { immer } from "zustand/middleware/immer";
 4 | import { createJSONStorage, devtools, persist } from "zustand/middleware";
 5 | import { createCurrentTaskSlice, CurrentTaskSlice } from "./currentTask";
 6 | import { createUiSlice, UiSlice } from "./ui";
 7 | import { createSettingsSlice, SettingsSlice } from "./settings";
 8 | import { findBestMatchingModel } from "../helpers/aiSdkUtils";
 9 | 
10 | export type StoreType = {
11 |   currentTask: CurrentTaskSlice;
12 |   ui: UiSlice;
13 |   settings: SettingsSlice;
14 | };
15 | 
16 | export type MyStateCreator<T> = StateCreator<
17 |   StoreType,
18 |   [["zustand/immer", never]],
19 |   [],
20 |   T
21 | >;
22 | 
/**
 * Application store combining the `currentTask`, `ui` and `settings` slices.
 *
 * Only `ui.instructions` and the settings listed in `partialize` are
 * persisted, in `localStorage` under the key "app-state". On rehydration the
 * persisted values are deep-merged over the current state and the selected
 * model is re-resolved with `findBestMatchingModel`.
 */
export const useAppState = create<StoreType>()(
  persist(
    immer(
      devtools((...a) => ({
        currentTask: createCurrentTaskSlice(...a),
        ui: createUiSlice(...a),
        settings: createSettingsSlice(...a),
      })),
    ),
    {
      name: "app-state",
      storage: createJSONStorage(() => localStorage),
      partialize: (state) => ({
        // Stuff we want to persist
        ui: {
          instructions: state.ui.instructions,
        },
        settings: {
          openAIKey: state.settings.openAIKey,
          anthropicKey: state.settings.anthropicKey,
          geminiKey: state.settings.geminiKey,
          openAIBaseUrl: state.settings.openAIBaseUrl,
          anthropicBaseUrl: state.settings.anthropicBaseUrl,
          agentMode: state.settings.agentMode,
          selectedModel: state.settings.selectedModel,
          voiceMode: state.settings.voiceMode,
          customKnowledgeBase: state.settings.customKnowledgeBase,
        },
      }),
      merge: (persistedState, currentState) => {
        // lodash `merge` mutates its first argument, so merge into a fresh
        // object instead of the state object handed over by zustand.
        const result = merge({}, currentState, persistedState);
        result.settings.selectedModel = findBestMatchingModel(
          result.settings.selectedModel,
          result.settings.agentMode,
          result.settings.openAIKey,
          result.settings.anthropicKey,
          result.settings.geminiKey,
        );
        return result;
      },
    },
  ),
);
66 | 
67 | // @ts-expect-error used for debugging
68 | window.getState = useAppState.getState;
69 | 


--------------------------------------------------------------------------------
/src/state/ui.ts:
--------------------------------------------------------------------------------
 1 | import { MyStateCreator } from "./store";
 2 | 
 3 | export type UiSlice = {
 4 |   instructions: string | null;
 5 |   actions: {
 6 |     setInstructions: (instructions: string) => void;
 7 |   };
 8 | };
 9 | export const createUiSlice: MyStateCreator<UiSlice> = (set) => ({
10 |   instructions: null,
11 |   actions: {
12 |     setInstructions: (instructions) => {
13 |       set((state) => {
14 |         state.ui.instructions = instructions;
15 |       });
16 |     },
17 |   },
18 | });
19 | 


--------------------------------------------------------------------------------
/src/vite-env.d.ts:
--------------------------------------------------------------------------------
1 | /// <reference types="vite/client" />
2 | 


--------------------------------------------------------------------------------
/tailwind.config.js:
--------------------------------------------------------------------------------
/** @type {import('tailwindcss').Config} */
const tailwindConfig = {
  // Files containing class names.
  content: ["./index.html", "./src/**/*.{js,ts,jsx,tsx}"],
  // No theme customizations.
  theme: { extend: {} },
  plugins: [],
};

export default tailwindConfig;
9 | 


--------------------------------------------------------------------------------
/test-utils/jest.setup.js:
--------------------------------------------------------------------------------
// Do what you need to set up your test
const SETUP_MESSAGE = "setup test: jest.setup.js";
console.log(SETUP_MESSAGE);
3 | 


--------------------------------------------------------------------------------
/tsconfig.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "compilerOptions": {
 3 |     "strict": true,
 4 |     "noEmit": true,
 5 |     "baseUrl": ".",
 6 |     "allowJs": false,
 7 |     "target": "esnext",
 8 |     "module": "esnext",
 9 |     "jsx": "react-jsx",
10 |     "skipLibCheck": true,
11 |     "esModuleInterop": true,
12 |     "resolveJsonModule": true,
13 |     "moduleResolution": "node",
14 |     "types": ["vite/client", "node"],
15 |     "noFallthroughCasesInSwitch": true,
16 |     "allowSyntheticDefaultImports": true,
17 |     "lib": ["dom", "dom.iterable", "esnext"],
18 |     "forceConsistentCasingInFileNames": true,
19 |     "typeRoots": ["./src/global.d.ts", "node_modules/@types"],
20 |     "paths": {
21 |       "@root/*": ["./*"],
22 |       "@src/*": ["src/*"],
23 |       "@assets/*": ["src/assets/*"],
24 |       "@pages/*": ["src/pages/*"],
25 |       "virtual:reload-on-update-in-background-script": ["./src/global.d.ts"],
26 |       "virtual:reload-on-update-in-view": ["./src/global.d.ts"]
27 |     }
28 |   },
29 |   "include": ["src", "utils", "vite.config.ts", "node_modules/@types"]
30 | }
31 | 


--------------------------------------------------------------------------------
/utils/log.ts:
--------------------------------------------------------------------------------
 1 | type ColorType = "success" | "info" | "error" | "warning" | keyof typeof COLORS;
 2 | type ValueOf<T> = T[keyof T];
 3 | 
 4 | export default function colorLog(message: string, type: ColorType) {
 5 |   let color: ValueOf<typeof COLORS>;
 6 | 
 7 |   switch (type) {
 8 |     case "success":
 9 |       color = COLORS.FgGreen;
10 |       break;
11 |     case "info":
12 |       color = COLORS.FgBlue;
13 |       break;
14 |     case "error":
15 |       color = COLORS.FgRed;
16 |       break;
17 |     case "warning":
18 |       color = COLORS.FgYellow;
19 |       break;
20 |     default:
21 |       color = COLORS[type];
22 |       break;
23 |   }
24 | 
25 |   console.log(color, message);
26 | }
27 | 
28 | const COLORS = {
29 |   Reset: "\x1b[0m",
30 |   Bright: "\x1b[1m",
31 |   Dim: "\x1b[2m",
32 |   Underscore: "\x1b[4m",
33 |   Blink: "\x1b[5m",
34 |   Reverse: "\x1b[7m",
35 |   Hidden: "\x1b[8m",
36 |   FgBlack: "\x1b[30m",
37 |   FgRed: "\x1b[31m",
38 |   FgGreen: "\x1b[32m",
39 |   FgYellow: "\x1b[33m",
40 |   FgBlue: "\x1b[34m",
41 |   FgMagenta: "\x1b[35m",
42 |   FgCyan: "\x1b[36m",
43 |   FgWhite: "\x1b[37m",
44 |   BgBlack: "\x1b[40m",
45 |   BgRed: "\x1b[41m",
46 |   BgGreen: "\x1b[42m",
47 |   BgYellow: "\x1b[43m",
48 |   BgBlue: "\x1b[44m",
49 |   BgMagenta: "\x1b[45m",
50 |   BgCyan: "\x1b[46m",
51 |   BgWhite: "\x1b[47m",
52 | } as const;
53 | 


--------------------------------------------------------------------------------
/utils/manifest-parser/index.ts:
--------------------------------------------------------------------------------
 1 | type Manifest = chrome.runtime.ManifestV3;
 2 | 
 3 | class ManifestParser {
 4 |   // eslint-disable-next-line @typescript-eslint/no-empty-function
 5 |   private constructor() {}
 6 | 
 7 |   static convertManifestToString(manifest: Manifest): string {
 8 |     if (process.env.__FIREFOX__) {
 9 |       manifest = this.convertToFirefoxCompatibleManifest(manifest);
10 |     }
11 |     return JSON.stringify(manifest, null, 2);
12 |   }
13 | 
14 |   static convertToFirefoxCompatibleManifest(manifest: Manifest) {
15 |     const manifestCopy = {
16 |       ...manifest,
17 |     } as { [key: string]: unknown };
18 | 
19 |     manifestCopy.background = {
20 |       scripts: [manifest.background?.service_worker],
21 |       type: "module",
22 |     };
23 |     manifestCopy.options_ui = {
24 |       page: manifest.options_page,
25 |       browser_style: false,
26 |     };
27 |     manifestCopy.content_security_policy = {
28 |       extension_pages: "script-src 'self'; object-src 'self'",
29 |     };
30 |     delete manifestCopy.options_page;
31 |     return manifestCopy as Manifest;
32 |   }
33 | }
34 | 
35 | export default ManifestParser;
36 | 


--------------------------------------------------------------------------------
/utils/plugins/add-hmr.ts:
--------------------------------------------------------------------------------
 1 | import * as path from "path";
 2 | import { readFileSync } from "fs";
 3 | import type { PluginOption } from "vite";
 4 | 
 5 | const isDev = process.env.__DEV__ === "true";
 6 | 
 7 | const DUMMY_CODE = `export default function(){};`;
 8 | 
 9 | function getInjectionCode(fileName: string): string {
10 |   return readFileSync(
11 |     path.resolve(__dirname, "..", "reload", "injections", fileName),
12 |     { encoding: "utf8" },
13 |   );
14 | }
15 | 
/** Which virtual HMR modules should carry real reload code. */
type Config = {
  background?: boolean;
  view?: boolean;
};

/**
 * Vite plugin that serves the two virtual modules
 * `virtual:reload-on-update-in-background-script` and
 * `virtual:reload-on-update-in-view`.
 *
 * Each module resolves to the matching injection script when `isDev` is true
 * and the corresponding flag is enabled (`background` defaults to `false`,
 * `view` to `true`); otherwise it resolves to `DUMMY_CODE`.
 */
export default function addHmr(config?: Config): PluginOption {
  const options: Config = config || {};
  const background = options.background === undefined ? false : options.background;
  const view = options.view === undefined ? true : options.view;

  const idInBackgroundScript = "virtual:reload-on-update-in-background-script";
  const idInView = "virtual:reload-on-update-in-view";

  const scriptHmrCode = isDev ? getInjectionCode("script.js") : DUMMY_CODE;
  const viewHmrCode = isDev ? getInjectionCode("view.js") : DUMMY_CODE;

  return {
    name: "add-hmr",
    resolveId(id) {
      const isVirtualId = [idInBackgroundScript, idInView].includes(id);
      if (isVirtualId) {
        return getResolvedId(id);
      }
    },
    load(id) {
      switch (id) {
        case getResolvedId(idInBackgroundScript):
          return background ? scriptHmrCode : DUMMY_CODE;
        case getResolvedId(idInView):
          return view ? viewHmrCode : DUMMY_CODE;
      }
    },
  };
}
47 | 
/** Prefixes `id` with a NUL character to form the resolved virtual-module id. */
function getResolvedId(id: string) {
  return `\0${id}`;
}
51 | 


--------------------------------------------------------------------------------
/utils/plugins/custom-dynamic-import.ts:
--------------------------------------------------------------------------------
 1 | import type { PluginOption } from "vite";
 2 | 
 3 | export default function customDynamicImport(): PluginOption {
 4 |   return {
 5 |     name: "custom-dynamic-import",
 6 |     renderDynamicImport({ moduleId }) {
 7 |       if (!moduleId.includes("node_modules") && process.env.__FIREFOX__) {
 8 |         return {
 9 |           left: `import(browser.runtime.getURL('./') + `,
10 |           right: ".split('../').join(''));",
11 |         };
12 |       }
13 |       return {
14 |         left: "import(",
15 |         right: ")",
16 |       };
17 |     },
18 |   };
19 | }
20 | 


--------------------------------------------------------------------------------
/utils/plugins/inline-vite-preload-script.ts:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * solution for multiple content scripts
 3 |  * https://github.com/Jonghakseo/chrome-extension-boilerplate-react-vite/issues/177#issuecomment-1784112536
 4 |  */
 5 | export default function inlineVitePreloadScript() {
 6 |   let __vitePreload = "";
 7 |   return {
 8 |     name: "replace-vite-preload-script-plugin",
 9 |     // @ts-expect-error: vite types are not up-to-date
10 |     async renderChunk(code, chunk, options, meta) {
11 |       if (!/content/.test(chunk.fileName.toLowerCase())) {
12 |         return null;
13 |       }
14 |       const chunkName: string | undefined = Object.keys(meta.chunks).find(
15 |         (key) => /preload/.test(key),
16 |       );
17 |       if (!chunkName) {
18 |         return null;
19 |       }
20 |       const modules = meta.chunks[chunkName].modules;
21 |       console.log(modules);
22 |       if (!__vitePreload) {
23 |         __vitePreload = modules[Object.keys(modules)[0]].code;
24 |         __vitePreload = __vitePreload.replaceAll("const ", "var ");
25 |       }
26 |       return {
27 |         code: __vitePreload + code.split(`\n`).slice(1).join(`\n`),
28 |       };
29 |     },
30 |   };
31 | }
32 | 


--------------------------------------------------------------------------------
/utils/plugins/make-manifest.ts:
--------------------------------------------------------------------------------
 1 | import * as fs from "fs";
 2 | import * as path from "path";
 3 | import colorLog from "../log";
 4 | import ManifestParser from "../manifest-parser";
 5 | import type { PluginOption } from "vite";
 6 | import url from "url";
 7 | import * as process from "process";
 8 | 
 9 | const { resolve } = path;
10 | 
11 | const rootDir = resolve(__dirname, "..", "..");
12 | const distDir = resolve(rootDir, "dist");
13 | const manifestFile = resolve(rootDir, "manifest.js");
14 | 
15 | const getManifestWithCacheBurst = (): Promise<{
16 |   default: chrome.runtime.ManifestV3;
17 | }> => {
18 |   const withCacheBurst = (path: string) => `${path}?${Date.now().toString()}`;
19 |   /**
20 |    * In Windows, import() doesn't work without file:// protocol.
21 |    * So, we need to convert path to file:// protocol. (url.pathToFileURL)
22 |    */
23 |   if (process.platform === "win32") {
24 |     return import(withCacheBurst(url.pathToFileURL(manifestFile).href));
25 |   }
26 |   return import(withCacheBurst(manifestFile));
27 | };
28 | 
/**
 * Vite plugin that writes `manifest.json` into the dist directory after each
 * bundle is written, and registers `manifest.js` as a watched file.
 *
 * @param config.contentScriptCssKey When set, replaces the `<KEY>`
 *   placeholder in every content-script CSS path with this value.
 */
export default function makeManifest(config: {
  contentScriptCssKey?: string;
}): PluginOption {
  const { contentScriptCssKey } = config;

  // Serializes `manifest` to `<to>/manifest.json`, creating `to` if needed.
  const writeManifest = (manifest: chrome.runtime.ManifestV3, to: string) => {
    if (!fs.existsSync(to)) {
      fs.mkdirSync(to);
    }
    const manifestPath = resolve(to, "manifest.json");

    // Naming change for cache invalidation
    if (contentScriptCssKey) {
      for (const script of manifest?.content_scripts ?? []) {
        script.css = script?.css?.map((css) =>
          css.replace("<KEY>", contentScriptCssKey),
        );
      }
    }

    const serialized = ManifestParser.convertManifestToString(manifest);
    fs.writeFileSync(manifestPath, serialized);

    colorLog(`Manifest file copy complete: ${manifestPath}`, "success");
  };

  return {
    name: "make-manifest",
    buildStart() {
      this.addWatchFile(manifestFile);
    },
    async writeBundle() {
      const { default: manifest } = await getManifestWithCacheBurst();
      writeManifest(manifest, distDir);
    },
  };
}
67 | 


--------------------------------------------------------------------------------
/utils/plugins/watch-rebuild.ts:
--------------------------------------------------------------------------------
 1 | import type { PluginOption } from "vite";
 2 | import { WebSocket } from "ws";
 3 | import MessageInterpreter from "../reload/interpreter";
 4 | import { LOCAL_RELOAD_SOCKET_URL } from "../reload/constant";
 5 | 
 6 | export default function watchRebuild(config: {
 7 |   whenWriteBundle: () => void;
 8 | }): PluginOption {
 9 |   const ws = new WebSocket(LOCAL_RELOAD_SOCKET_URL);
10 |   return {
11 |     name: "watch-rebuild",
12 |     writeBundle() {
13 |       /**
14 |        * When the build is complete, send a message to the reload server.
15 |        * The reload server will send a message to the client to reload or refresh the extension.
16 |        */
17 |       ws.send(MessageInterpreter.send({ type: "build_complete" }));
18 |       config.whenWriteBundle();
19 |     },
20 |   };
21 | }
22 | 


--------------------------------------------------------------------------------
/utils/reload/constant.ts:
--------------------------------------------------------------------------------
/** Port of the local reload WebSocket server. */
export const LOCAL_RELOAD_SOCKET_PORT = 8082;
/** `ws://` URL of the local reload WebSocket server. */
export const LOCAL_RELOAD_SOCKET_URL =
  "ws://localhost:" + String(LOCAL_RELOAD_SOCKET_PORT);
3 | 


--------------------------------------------------------------------------------
/utils/reload/initReloadClient.ts:
--------------------------------------------------------------------------------
 1 | import { LOCAL_RELOAD_SOCKET_URL } from "./constant";
 2 | import MessageInterpreter from "./interpreter";
 3 | 
 4 | let needToUpdate = false;
 5 | 
 6 | export default function initReloadClient({
 7 |   watchPath,
 8 |   onUpdate,
 9 |   onForceReload,
10 | }: {
11 |   watchPath: string;
12 |   onUpdate: () => void;
13 |   onForceReload?: () => void;
14 | }): WebSocket {
15 |   const socket = new WebSocket(LOCAL_RELOAD_SOCKET_URL);
16 | 
17 |   function sendUpdateCompleteMessage() {
18 |     socket.send(MessageInterpreter.send({ type: "done_update" }));
19 |   }
20 | 
21 |   socket.addEventListener("message", (event) => {
22 |     const message = MessageInterpreter.receive(String(event.data));
23 | 
24 |     switch (message.type) {
25 |       case "do_update": {
26 |         if (needToUpdate) {
27 |           sendUpdateCompleteMessage();
28 |           needToUpdate = false;
29 |           onUpdate();
30 |         }
31 |         return;
32 |       }
33 |       case "wait_update": {
34 |         if (!needToUpdate) {
35 |           needToUpdate = message.path.includes(watchPath);
36 |         }
37 |         return;
38 |       }
39 |       case "force_reload": {
40 |         onForceReload?.();
41 |         return;
42 |       }
43 |     }
44 |   });
45 | 
46 |   socket.onclose = () => {
47 |     console.log(
48 |       `Reload server disconnected.\nPlease check if the WebSocket server is running properly on ${LOCAL_RELOAD_SOCKET_URL}. This feature detects changes in the code and helps the browser to reload the extension or refresh the current tab.`,
49 |     );
50 |     setTimeout(() => {
51 |       initReloadClient({ watchPath, onUpdate });
52 |     }, 1000);
53 |   };
54 | 
55 |   return socket;
56 | }
57 | 


--------------------------------------------------------------------------------
/utils/reload/initReloadServer.ts:
--------------------------------------------------------------------------------
 1 | import { WebSocket, WebSocketServer } from "ws";
 2 | import chokidar from "chokidar";
 3 | import { LOCAL_RELOAD_SOCKET_PORT, LOCAL_RELOAD_SOCKET_URL } from "./constant";
 4 | import MessageInterpreter from "./interpreter";
 5 | import { debounce } from "./utils";
 6 | 
 7 | const clientsThatNeedToUpdate: Set<WebSocket> = new Set();
 8 | let needToForceReload = false;
 9 | 
10 | function initReloadServer() {
11 |   const wss = new WebSocketServer({ port: LOCAL_RELOAD_SOCKET_PORT });
12 | 
13 |   wss.on("listening", () =>
14 |     console.log(`[HRS] Server listening at ${LOCAL_RELOAD_SOCKET_URL}`),
15 |   );
16 | 
17 |   wss.on("connection", (ws) => {
18 |     clientsThatNeedToUpdate.add(ws);
19 | 
20 |     ws.addEventListener("close", () => clientsThatNeedToUpdate.delete(ws));
21 |     ws.addEventListener("message", (event) => {
22 |       if (typeof event.data !== "string") return;
23 | 
24 |       const message = MessageInterpreter.receive(event.data);
25 | 
26 |       if (message.type === "done_update") {
27 |         ws.close();
28 |       }
29 |       if (message.type === "build_complete") {
30 |         clientsThatNeedToUpdate.forEach((ws: WebSocket) =>
31 |           ws.send(MessageInterpreter.send({ type: "do_update" })),
32 |         );
33 |         if (needToForceReload) {
34 |           needToForceReload = false;
35 |           clientsThatNeedToUpdate.forEach((ws: WebSocket) =>
36 |             ws.send(MessageInterpreter.send({ type: "force_reload" })),
37 |           );
38 |         }
39 |       }
40 |     });
41 |   });
42 | }
43 | 
/** CHECK:: src file was updated **/
const debounceSrc = debounce((path: string) => {
  // Normalize path on Windows
  const pathConverted = path.split("\\").join("/");
  const payload = { type: "wait_update", path: pathConverted } as const;
  clientsThatNeedToUpdate.forEach((ws: WebSocket) => {
    ws.send(MessageInterpreter.send(payload));
  });
}, 100);

const srcWatcher = chokidar.watch("src", { ignorePermissionErrors: true });
srcWatcher.on("all", (_, path) => debounceSrc(path));

/** CHECK:: manifest.js was updated **/
const manifestWatcher = chokidar.watch("manifest.js", {
  ignorePermissionErrors: true,
});
manifestWatcher.on("all", () => {
  // Picked up by the next `build_complete` message.
  needToForceReload = true;
});

initReloadServer();
66 | 


--------------------------------------------------------------------------------
/utils/reload/injections/script.ts:
--------------------------------------------------------------------------------
 1 | import initReloadClient from "../initReloadClient";
 2 | 
 3 | export default function addHmrIntoScript(watchPath: string) {
 4 |   const reload = () => {
 5 |     chrome.runtime.reload();
 6 |   };
 7 | 
 8 |   initReloadClient({
 9 |     watchPath,
10 |     onUpdate: reload,
11 |     onForceReload: reload,
12 |   });
13 | }
14 | 


--------------------------------------------------------------------------------
/utils/reload/injections/view.ts:
--------------------------------------------------------------------------------
 1 | import initReloadClient from "../initReloadClient";
 2 | 
 3 | export default function addHmrIntoView(watchPath: string) {
 4 |   let pendingReload = false;
 5 | 
 6 |   initReloadClient({
 7 |     watchPath,
 8 |     onUpdate: () => {
 9 |       // disable reload when tab is hidden
10 |       if (document.hidden) {
11 |         pendingReload = true;
12 |         return;
13 |       }
14 |       reload();
15 |     },
16 |   });
17 | 
18 |   // reload
19 |   function reload(): void {
20 |     pendingReload = false;
21 |     window.location.reload();
22 |   }
23 | 
24 |   // reload when tab is visible
25 |   function reloadWhenTabIsVisible(): void {
26 |     !document.hidden && pendingReload && reload();
27 |   }
28 |   document.addEventListener("visibilitychange", reloadWhenTabIsVisible);
29 | }
30 | 


--------------------------------------------------------------------------------
/utils/reload/interpreter/index.ts:
--------------------------------------------------------------------------------
 1 | import type { WebSocketMessage, SerializedMessage } from "./types";
 2 | 
 3 | export default class MessageInterpreter {
 4 |   // eslint-disable-next-line @typescript-eslint/no-empty-function
 5 |   private constructor() {}
 6 | 
 7 |   static send(message: WebSocketMessage): SerializedMessage {
 8 |     return JSON.stringify(message);
 9 |   }
10 |   static receive(serializedMessage: SerializedMessage): WebSocketMessage {
11 |     return JSON.parse(serializedMessage);
12 |   }
13 | }
14 | 


--------------------------------------------------------------------------------
/utils/reload/interpreter/types.ts:
--------------------------------------------------------------------------------
 1 | type UpdatePendingMessage = {
 2 |   type: "wait_update";
 3 |   path: string;
 4 | };
 5 | type UpdateRequestMessage = {
 6 |   type: "do_update";
 7 | };
 8 | type UpdateCompleteMessage = { type: "done_update" };
 9 | type BuildCompletionMessage = { type: "build_complete" };
10 | type ForceReloadMessage = { type: "force_reload" };
11 | 
12 | export type SerializedMessage = string;
13 | export type WebSocketMessage =
14 |   | UpdateCompleteMessage
15 |   | UpdateRequestMessage
16 |   | UpdatePendingMessage
17 |   | BuildCompletionMessage
18 |   | ForceReloadMessage;
19 | 


--------------------------------------------------------------------------------
/utils/reload/rollup.config.mjs:
--------------------------------------------------------------------------------
 1 | import typescript from "@rollup/plugin-typescript";
 2 | 
 3 | const plugins = [typescript()];
 4 | 
 5 | export default [
 6 |   {
 7 |     plugins,
 8 |     input: "utils/reload/initReloadServer.ts",
 9 |     output: {
10 |       file: "utils/reload/initReloadServer.js",
11 |     },
12 |     external: ["ws", "chokidar", "timers"],
13 |   },
14 |   {
15 |     plugins,
16 |     input: "utils/reload/injections/script.ts",
17 |     output: {
18 |       file: "utils/reload/injections/script.js",
19 |     },
20 |   },
21 |   {
22 |     plugins,
23 |     input: "utils/reload/injections/view.ts",
24 |     output: {
25 |       file: "utils/reload/injections/view.js",
26 |     },
27 |   },
28 | ];
29 | 


--------------------------------------------------------------------------------
/utils/reload/utils.ts:
--------------------------------------------------------------------------------
 1 | import { clearTimeout } from "timers";
 2 | 
 3 | export function debounce<A extends unknown[]>(
 4 |   callback: (...args: A) => void,
 5 |   delay: number,
 6 | ) {
 7 |   let timer: NodeJS.Timeout;
 8 |   return function (...args: A) {
 9 |     clearTimeout(timer);
10 |     timer = setTimeout(() => callback(...args), delay);
11 |   };
12 | }
13 | 


--------------------------------------------------------------------------------
/vite.config.ts:
--------------------------------------------------------------------------------
 1 | import { defineConfig } from "vite";
 2 | import react from "@vitejs/plugin-react";
 3 | import path, { resolve } from "path";
 4 | import makeManifest from "./utils/plugins/make-manifest";
 5 | import customDynamicImport from "./utils/plugins/custom-dynamic-import";
 6 | import addHmr from "./utils/plugins/add-hmr";
 7 | import inlineVitePreloadScript from "./utils/plugins/inline-vite-preload-script";
 8 | 
 9 | const rootDir = resolve(__dirname);
10 | const srcDir = resolve(rootDir, "src");
11 | const pagesDir = resolve(srcDir, "pages");
12 | const assetsDir = resolve(srcDir, "assets");
13 | const outDir = resolve(rootDir, "dist");
14 | const publicDir = resolve(rootDir, "public");
15 | 
16 | const isDev = process.env.__DEV__ === "true";
17 | const isProduction = !isDev;
18 | 
19 | // ENABLE HMR IN BACKGROUND SCRIPT
20 | const enableHmrInBackgroundScript = true;
21 | 
22 | export default defineConfig({
23 |   resolve: {
24 |     alias: {
25 |       "@root": rootDir,
26 |       "@src": srcDir,
27 |       "@assets": assetsDir,
28 |       "@pages": pagesDir,
29 |     },
30 |   },
31 |   plugins: [
32 |     makeManifest({}),
33 |     react(),
34 |     customDynamicImport(),
35 |     addHmr({ background: enableHmrInBackgroundScript, view: true }),
36 |     inlineVitePreloadScript(),
37 |   ],
38 |   publicDir,
39 |   build: {
40 |     outDir,
41 |     /** Can slow down build speed. */
42 |     // sourcemap: isDev,
43 |     minify: isProduction,
44 |     modulePreload: false,
45 |     reportCompressedSize: isProduction,
46 |     emptyOutDir: !isDev,
47 |     rollupOptions: {
48 |       input: {
49 |         devtools: resolve(pagesDir, "devtools", "index.html"),
50 |         panel: resolve(pagesDir, "panel", "index.html"),
51 |         background: resolve(pagesDir, "background", "index.ts"),
52 |         content: resolve(pagesDir, "content", "index.ts"),
53 |         contentStyleGlobal: resolve(pagesDir, "content", "style.global.scss"),
54 |         contentStyle: resolve(pagesDir, "content", "style.scss"),
55 |         contentInjected: resolve(pagesDir, "content/mainWorld", "index.ts"),
56 |         permission: resolve(pagesDir, "permission", "index.html"),
57 |         popup: resolve(pagesDir, "popup", "index.html"),
58 |         newtab: resolve(pagesDir, "newtab", "index.html"),
59 |         options: resolve(pagesDir, "options", "index.html"),
60 |         sidepanel: resolve(pagesDir, "sidepanel", "index.html"),
61 |       },
62 |       output: {
63 |         entryFileNames: "src/pages/[name]/index.js",
64 |         chunkFileNames: isDev
65 |           ? "assets/js/[name].js"
66 |           : "assets/js/[name].[hash].js",
67 |         assetFileNames: (assetInfo) => {
68 |           const { name, ext } = path.parse(assetInfo.name ?? "");
69 |           if (isFont(ext)) {
70 |             return `assets/fonts/${name}${ext}`;
71 |           }
72 |           return `assets/[ext]/[name].[ext]`;
73 |         },
74 |       },
75 |     },
76 |   },
77 | });
78 | 
/**
 * Tells whether `ext` (including its leading dot) is exactly one of the font
 * extensions `.woff`, `.woff2`, `.eot`, `.ttf` or `.otf` (case-sensitive).
 */
function isFont(ext: string): boolean {
  const fontExtensions = [".woff", ".woff2", ".eot", ".ttf", ".otf"];
  return fontExtensions.includes(ext);
}
82 | 


--------------------------------------------------------------------------------