├── .github
    ├── ISSUE_TEMPLATE
    │   ├── bug_report.md
    │   └── feature_request.md
    └── workflows
    │   └── python-package.yml
├── .gitignore
├── Dockerfile
├── LICENSE.md
├── MANIFEST.in
├── README.md
├── chainforge
    ├── __init__.py
    ├── app.py
    ├── examples
    │   ├── animal-images.cforge
    │   ├── audit-bias.cforge
    │   ├── basic-comparison.cforge
    │   ├── basic-function-calls.cforge
    │   ├── basic-math.cforge
    │   ├── book-beginnings.cforge
    │   ├── chaining-prompts.cforge
    │   ├── chat-sycophancy.cforge
    │   ├── compare-prompts.cforge
    │   ├── comparing-formats.cforge
    │   ├── comparing-system-msg.cforge
    │   ├── custom_provider_cohere.py
    │   ├── mosquito-knowledge.cforge
    │   ├── prompt-injection-test.cforge
    │   ├── python-coding-eval.cforge
    │   ├── red-team-stereotypes.cforge
    │   ├── structured-outputs.cforge
    │   └── tweet-multi-eval.cforge
    ├── flask_app.py
    ├── oaievals
    │   ├── 2d_movement.cforge
    │   ├── README.md
    │   ├── adultery_state_laws.cforge
    │   ├── afrikaans-lexicon.cforge
    │   ├── aime_evaluation.cforge
    │   ├── algebra-word-problems.cforge
    │   ├── ambiguous-sentences.cforge
    │   ├── arithmetical_puzzles.cforge
    │   ├── asl-classifiers.cforge
    │   ├── atpl_exams.cforge
    │   ├── balance-chemical-equation.cforge
    │   ├── banking77.cforge
    │   ├── beam-analysis.cforge
    │   ├── belarusian-grammar.cforge
    │   ├── belarusian-lexicon.cforge
    │   ├── belarusian-proverbs.cforge
    │   ├── belarusian-russian-translation.cforge
    │   ├── belarusian-syllable-count.cforge
    │   ├── belarusian-synonyms.cforge
    │   ├── bitwise.cforge
    │   ├── body-movement.cforge
    │   ├── born-first.cforge
    │   ├── brazilian_laws.cforge
    │   ├── building_floorplan.cforge
    │   ├── bulgarian-lexicon.cforge
    │   ├── canto_wu_pronunciation.cforge
    │   ├── chess-piece-count.cforge
    │   ├── chess.cforge
    │   ├── chinese_tang_poetries.cforge
    │   ├── chinese_zodiac.cforge
    │   ├── color_theory_complementary.cforge
    │   ├── compare-countries-area.cforge
    │   ├── comprehensive-graph-reasoning.cforge
    │   ├── contents.json
    │   ├── count_intersections_polynomial.cforge
    │   ├── count_token_freq_dna.cforge
    │   ├── counterfactual-reasoning.cforge
    │   ├── countries.cforge
    │   ├── crepe.cforge
    │   ├── cricket_situations.cforge
    │   ├── crontab.cforge
    │   ├── cube-pack.cforge
    │   ├── date-booking.cforge
    │   ├── date-calculator.cforge
    │   ├── day-of-week-from-date.cforge
    │   ├── determinant.cforge
    │   ├── diagrammatic_logic.cforge
    │   ├── directions.cforge
    │   ├── dna-melting-calculation.cforge
    │   ├── dutch-lexicon.cforge
    │   ├── emoji-riddle.cforge
    │   ├── escher-sentences.cforge
    │   ├── european-date-format-challenge.cforge
    │   ├── fcc_amateur_extra.cforge
    │   ├── finance.cforge
    │   ├── financial-derivatives.cforge
    │   ├── find-letter.cforge
    │   ├── find-thirukkural.cforge
    │   ├── find_country_from_svg.cforge
    │   ├── finnish-rhyme.cforge
    │   ├── first-letters.cforge
    │   ├── food.cforge
    │   ├── formal-grammar-to-regex.cforge
    │   ├── french-lexicon.cforge
    │   ├── french-part-of-speech.cforge
    │   ├── geometry_puzzle.cforge
    │   ├── german-part-of-speech.cforge
    │   ├── gol.cforge
    │   ├── greek-vocabulary.cforge
    │   ├── guess-the-singer.cforge
    │   ├── heart-disease.cforge
    │   ├── hebrew-bible.cforge
    │   ├── hebrew-rhyme.cforge
    │   ├── hebrew-same-noun-gender.cforge
    │   ├── hindi_shuddha.cforge
    │   ├── hindi_words.cforge
    │   ├── historical-kana-orthography-reading.cforge
    │   ├── imperial_date_to_string.cforge
    │   ├── indonesian_numbers.cforge
    │   ├── infiniteloop-match.cforge
    │   ├── internal_representations.cforge
    │   ├── invert_word_wise.cforge
    │   ├── invoice_due_date_leap_day_adjustment.cforge
    │   ├── irony.cforge
    │   ├── islands.cforge
    │   ├── isosceles-right-triangle.cforge
    │   ├── italian-new-words.cforge
    │   ├── italian-rhyme.cforge
    │   ├── japanese-itpassport-exam01.cforge
    │   ├── japanese-national-medical-exam01.cforge
    │   ├── japanese-national-medical-exam02.cforge
    │   ├── japanese_driving_license.cforge
    │   ├── japanese_number_reading.cforge
    │   ├── japanese_populer_video_game_title_and_the_publisher.cforge
    │   ├── jee-math.cforge
    │   ├── job_listing_title_for_a_caregiver_in_japan.cforge
    │   ├── json_patch_object.cforge
    │   ├── kanji-idioms.cforge
    │   ├── korean-consonant-vowel-combination.cforge
    │   ├── korean_spelling.cforge
    │   ├── korean_yaminjeongeum.cforge
    │   ├── largest_country.cforge
    │   ├── last-word-nth.cforge
    │   ├── lat_long_identify.cforge
    │   ├── linear-equations.cforge
    │   ├── list_comparison_missing_name.cforge
    │   ├── logic-statements.cforge
    │   ├── logiqa.cforge
    │   ├── mandaliof-table.cforge
    │   ├── map-electronic-component-part-to-fact.cforge
    │   ├── mate-in-one.cforge
    │   ├── matrix-mult-rows.cforge
    │   ├── medmcqa.cforge
    │   ├── missing-operators.cforge
    │   ├── moral_exceptQA.cforge
    │   ├── multi-step-equations.cforge
    │   ├── multistep-word-problems.cforge
    │   ├── music-theory-chord-notes.cforge
    │   ├── music_theory_scale_modes.cforge
    │   ├── nepali-song-singer.cforge
    │   ├── newsology.cforge
    │   ├── next-val-series.cforge
    │   ├── norwegian-lexicon.cforge
    │   ├── number-pattern.cforge
    │   ├── number-reading.cforge
    │   ├── numbers_game.cforge
    │   ├── numeral-type-comparisons.cforge
    │   ├── ordered-history-events.cforge
    │   ├── partially_solved_crossword_clues.cforge
    │   ├── passing-balls.cforge
    │   ├── pattern_identification.cforge
    │   ├── ph_calculation.cforge
    │   ├── physics-interaction.cforge
    │   ├── points-on-line.cforge
    │   ├── poker_analysis.cforge
    │   ├── polish-lexicon.cforge
    │   ├── polish-syllable-count.cforge
    │   ├── portuguese-sarcasm.cforge
    │   ├── portuguese-syllable-count.cforge
    │   ├── probability_questions.cforge
    │   ├── pure_korean.cforge
    │   ├── python_list_comprehension.cforge
    │   ├── rare-and-loanwords-dutch-lexicon.cforge
    │   ├── regex-match.cforge
    │   ├── resistor-ohm-calculator.cforge
    │   ├── reverse-polish-notation.cforge
    │   ├── reverse-string.cforge
    │   ├── rhetorical-devices.cforge
    │   ├── rock-climbing.cforge
    │   ├── rot13.cforge
    │   ├── russian-english-homonym-context-resolution.cforge
    │   ├── russian-lexicon.cforge
    │   ├── russian-rhyme.cforge
    │   ├── russian_medical.cforge
    │   ├── seating_arrangements.cforge
    │   ├── shape-in-shape.cforge
    │   ├── shared-borders.cforge
    │   ├── shopping_discount_comparison.cforge
    │   ├── simple-knowledge-mongolian.cforge
    │   ├── simple_physics_engine.cforge
    │   ├── solve-for-variable.cforge
    │   ├── sort-numeric.cforge
    │   ├── south-african-bands.cforge
    │   ├── spanish_feminine_noun_masculine_article.cforge
    │   ├── split_chinese_characters.cforge
    │   ├── squares-gpt.cforge
    │   ├── stats-tests.cforge
    │   ├── svg_understanding.cforge
    │   ├── swap-words.cforge
    │   ├── swedish-spelling.cforge
    │   ├── swedish_sat.cforge
    │   ├── syllables_long_words.cforge
    │   ├── syntax-check.cforge
    │   ├── taxes.cforge
    │   ├── tempo_to_measure_count.cforge
    │   ├── test-comp-sci.cforge
    │   ├── test_japanese_radical.cforge
    │   ├── test_japanese_units.cforge
    │   ├── tetris.cforge
    │   ├── three-pt-mapping.cforge
    │   ├── track_objects.cforge
    │   ├── tracking-shuffled-objects.cforge
    │   ├── turkish_characters.cforge
    │   ├── unified-patch.cforge
    │   ├── unsolvable_questions.cforge
    │   ├── utility_price_parsing.cforge
    │   ├── vigenere.cforge
    │   ├── vintage_phone_keyboard_decode.cforge
    │   ├── which-is-heavier.cforge
    │   ├── wkt_understanding.cforge
    │   └── word_vector_over_reliance.cforge
    ├── providers
    │   ├── __init__.py
    │   └── protocol.py
    ├── react-server
    │   ├── .eslintrc.js
    │   ├── .gitignore
    │   ├── .nvmrc
    │   ├── .prettierignore
    │   ├── .prettierrc.json
    │   ├── README.md
    │   ├── craco.config.js
    │   ├── package-lock.json
    │   ├── package.json
    │   ├── public
    │   │   ├── favicon.ico
    │   │   ├── index.html
    │   │   ├── logo192.png
    │   │   ├── logo512.png
    │   │   ├── manifest.json
    │   │   └── robots.txt
    │   ├── src
    │   │   ├── AiPopover.tsx
    │   │   ├── AlertModal.tsx
    │   │   ├── App.css
    │   │   ├── App.tsx
    │   │   ├── AreYouSureModal.tsx
    │   │   ├── BaseNode.tsx
    │   │   ├── ChatHistoryView.tsx
    │   │   ├── CodeEvaluatorNode.tsx
    │   │   ├── ColorThemeProvider.tsx
    │   │   ├── CommentNode.tsx
    │   │   ├── EditableTable.tsx
    │   │   ├── EvalGen
    │   │   │   ├── EvalGenWizard.tsx
    │   │   │   ├── FeedbackStep.tsx
    │   │   │   ├── GradeResponsesStep.tsx
    │   │   │   ├── GradingView.tsx
    │   │   │   ├── PickCriteriaStep.tsx
    │   │   │   ├── ReportCardStep.tsx
    │   │   │   └── WelcomeStep.tsx
    │   │   ├── ExampleFlowsModal.tsx
    │   │   ├── FlowSidebar.tsx
    │   │   ├── GlobalSettingsModal.tsx
    │   │   ├── ImagePreviewModal.tsx
    │   │   ├── InspectFooter.tsx
    │   │   ├── InspectorNode.tsx
    │   │   ├── ItemsNode.tsx
    │   │   ├── JoinNode.tsx
    │   │   ├── LLMEvalNode.tsx
    │   │   ├── LLMItemButtonGroup.tsx
    │   │   ├── LLMListComponent.tsx
    │   │   ├── LLMListItem.tsx
    │   │   ├── LLMResponseInspector.tsx
    │   │   ├── LLMResponseInspectorDrawer.tsx
    │   │   ├── LLMResponseInspectorModal.tsx
    │   │   ├── MediaNode.tsx
    │   │   ├── ModelSettingSchemas.tsx
    │   │   ├── ModelSettingsModal.tsx
    │   │   ├── MultiEvalNode.tsx
    │   │   ├── NestedMenu.tsx
    │   │   ├── NodeLabelComponent.tsx
    │   │   ├── PlotLegend.tsx
    │   │   ├── PromptNode.tsx
    │   │   ├── RemoveEdge.tsx
    │   │   ├── RenameValueModal.tsx
    │   │   ├── RequestClarificationModal.tsx
    │   │   ├── ResponseBoxes.tsx
    │   │   ├── ResponseRatingToolbar.tsx
    │   │   ├── ScriptNode.tsx
    │   │   ├── SimpleEvalNode.tsx
    │   │   ├── SplitNode.tsx
    │   │   ├── StatusIndicatorComponent.tsx
    │   │   ├── StrictModeDroppable.js
    │   │   ├── TabularDataNode.tsx
    │   │   ├── TemplateHooksComponent.tsx
    │   │   ├── TextFieldsNode.tsx
    │   │   ├── UploadFileModal.tsx
    │   │   ├── VisNode.tsx
    │   │   ├── backend
    │   │   │   ├── __test__
    │   │   │   │   ├── ai.test.ts
    │   │   │   │   ├── aiSuggestionsManager.test.ts
    │   │   │   │   ├── backend.test.ts
    │   │   │   │   ├── cache.test.ts
    │   │   │   │   ├── query.test.ts
    │   │   │   │   ├── setUtils.test.ts
    │   │   │   │   ├── template.test.ts
    │   │   │   │   └── utils.test.ts
    │   │   │   ├── ai.ts
    │   │   │   ├── aiSuggestionsManager.ts
    │   │   │   ├── backend.ts
    │   │   │   ├── cache.ts
    │   │   │   ├── canceler.ts
    │   │   │   ├── errors.ts
    │   │   │   ├── evalgen
    │   │   │   │   ├── README.md
    │   │   │   │   ├── executor.ts
    │   │   │   │   ├── oai_utils.ts
    │   │   │   │   ├── test.ts
    │   │   │   │   ├── typing.ts
    │   │   │   │   └── utils.ts
    │   │   │   ├── models.ts
    │   │   │   ├── pyodide
    │   │   │   │   ├── exec-py.js
    │   │   │   │   └── exec-py.worker.js
    │   │   │   ├── query.ts
    │   │   │   ├── setUtils.ts
    │   │   │   ├── tableUtils.ts
    │   │   │   ├── template.ts
    │   │   │   ├── typing.ts
    │   │   │   └── utils.ts
    │   │   ├── example_flows.tsx
    │   │   ├── index.css
    │   │   ├── index.js
    │   │   ├── logo.svg
    │   │   ├── reportWebVitals.js
    │   │   ├── setupTests.js
    │   │   ├── store.tsx
    │   │   └── styles.css
    │   └── tsconfig.json
    ├── requirements.txt
    └── security
    │   ├── __init__.py
    │   ├── password_utils.py
    │   └── secure_save.py
└── setup.py


/.github/ISSUE_TEMPLATE/bug_report.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Bug report
 3 | about: Create a report to help us improve
 4 | title: ''
 5 | labels: ''
 6 | assignees: ''
 7 | 
 8 | ---
 9 | 
10 | **Describe the bug**
11 | A clear and concise description of what the bug is.
12 | 
13 | **To Reproduce**
14 | Steps to reproduce the behavior:
15 | 1. Go to '...'
16 | 2. Click on '....'
17 | 3. Scroll down to '....'
18 | 4. See error
19 | 
20 | **Expected behavior**
21 | A clear and concise description of what you expected to happen.
22 | 
23 | **Screenshots**
24 | If applicable, add screenshots to help explain your problem.
25 | 
26 | **Desktop (please complete the following information):**
27 |  - OS: [e.g. iOS]
28 |  - Browser [e.g. chrome, safari]
29 |  - Version [e.g. 22]
30 | 
31 | **Smartphone (please complete the following information):**
32 |  - Device: [e.g. iPhone6]
33 |  - OS: [e.g. iOS8.1]
34 |  - Browser [e.g. stock browser, safari]
35 |  - Version [e.g. 22]
36 | 
37 | **Additional context**
38 | Add any other context about the problem here.
39 | 


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/feature_request.md:
--------------------------------------------------------------------------------
 1 | ---
 2 | name: Feature request
 3 | about: Suggest an idea for this project
 4 | title: ''
 5 | labels: ''
 6 | assignees: ''
 7 | 
 8 | ---
 9 | 
10 | **Is your feature request related to a problem? Please describe.**
11 | A clear and concise description of what the problem is. Ex. I'm always frustrated when [...]
12 | 
13 | **Describe the solution you'd like**
14 | A clear and concise description of what you want to happen.
15 | 
16 | **Describe alternatives you've considered**
17 | A clear and concise description of any alternative solutions or features you've considered.
18 | 
19 | **Additional context**
20 | Add any other context or screenshots about the feature request here.
21 | 


--------------------------------------------------------------------------------
/.github/workflows/python-package.yml:
--------------------------------------------------------------------------------
 1 | name: Validate Install
 2 | 
 3 | on:
 4 |   push:
 5 |     branches: [ main ]
 6 |   pull_request:
 7 |     branches: [ main ]
 8 | 
 9 | jobs:
10 |   test:
11 |     runs-on: ${{ matrix.os }}
12 | 
13 |     strategy:
14 |       matrix:
15 |         os: [ubuntu-latest, windows-latest, macos-latest, macos-13, macos-14]
16 |         python-version: [3.11, 3.12, 3.13]
17 |       fail-fast: false
18 | 
19 |     steps:
20 |     - name: Check out the repository
21 |       uses: actions/checkout@v3
22 | 
23 |     - name: Set up Python ${{ matrix.python-version }}
24 |       uses: actions/setup-python@v4
25 |       with:
26 |         python-version: ${{ matrix.python-version }}
27 | 
28 |     - name: Cache pip
29 |       uses: actions/cache@v4
30 |       with:
31 |         path: ~/.cache/pip
32 |         key: ${{ runner.os }}-pip-${{ matrix.python-version }}-${{ hashFiles('chainforge/requirements.txt') }}
33 |         restore-keys: |
34 |           ${{ runner.os }}-pip-${{ matrix.python-version }}-
35 | 
36 |     - name: Upgrade pip
37 |       run: python -m pip install --upgrade pip
38 | 
39 |     - name: Install dependencies
40 |       run: |
41 |         pip install -r chainforge/requirements.txt
42 |         pip install .
43 |         pip install pytest
44 | 
45 |     # TODO: Check that the server runs
46 | 
47 |     # TODO: Add pytest
48 |     # - name: Run tests
49 |     #   run: pytest
50 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
  1 | *.DS_Store
  2 | chainforge/cache
  3 | chainforge/examples/oaievals/
  4 | chainforge/react-server/node_modules
  5 | chainforge/react-server/build
  6 | 
  7 | # == Below was generated by https://www.toptal.com/developers/gitignore/api/python ==
  8 | # Edit at https://www.toptal.com/developers/gitignore?templates=python
  9 | 
 10 | ### Python ###
 11 | # Byte-compiled / optimized / DLL files
 12 | __pycache__/
 13 | *.py[cod]
 14 | *$py.class
 15 | 
 16 | # Docker
 17 | packages/
 18 | jobs/
 19 | 
 20 | # C extensions
 21 | *.so
 22 | 
 23 | # Distribution / packaging
 24 | .Python
 25 | develop-eggs/
 26 | dist/
 27 | downloads/
 28 | eggs/
 29 | .eggs/
 30 | lib/
 31 | lib64/
 32 | parts/
 33 | sdist/
 34 | var/
 35 | wheels/
 36 | share/python-wheels/
 37 | *.egg-info/
 38 | .installed.cfg
 39 | *.egg
 40 | MANIFEST
 41 | 
 42 | # PyInstaller
 43 | #  Usually these files are written by a python script from a template
 44 | #  before PyInstaller builds the exe, so as to inject date/other infos into it.
 45 | *.manifest
 46 | *.spec
 47 | 
 48 | # Installer logs
 49 | pip-log.txt
 50 | pip-delete-this-directory.txt
 51 | 
 52 | # Unit test / coverage reports
 53 | htmlcov/
 54 | .tox/
 55 | .nox/
 56 | .coverage
 57 | .coverage.*
 58 | .cache
 59 | nosetests.xml
 60 | coverage.xml
 61 | *.cover
 62 | *.py,cover
 63 | .hypothesis/
 64 | .pytest_cache/
 65 | cover/
 66 | 
 67 | # Translations
 68 | *.mo
 69 | *.pot
 70 | 
 71 | # Django stuff:
 72 | *.log
 73 | local_settings.py
 74 | db.sqlite3
 75 | db.sqlite3-journal
 76 | 
 77 | # Flask stuff:
 78 | instance/
 79 | .webassets-cache
 80 | 
 81 | # Scrapy stuff:
 82 | .scrapy
 83 | 
 84 | # Sphinx documentation
 85 | docs/_build/
 86 | 
 87 | # PyBuilder
 88 | .pybuilder/
 89 | target/
 90 | 
 91 | # Jupyter Notebook
 92 | .ipynb_checkpoints
 93 | 
 94 | # IPython
 95 | profile_default/
 96 | ipython_config.py
 97 | 
 98 | # pyenv
 99 | #   For a library or package, you might want to ignore these files since the code is
100 | #   intended to run in multiple environments; otherwise, check them in:
101 | # .python-version
102 | 
103 | # pipenv
104 | #   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
105 | #   However, in case of collaboration, if having platform-specific dependencies or dependencies
106 | #   having no cross-platform support, pipenv may install dependencies that don't work, or not
107 | #   install all needed dependencies.
108 | #Pipfile.lock
109 | 
110 | # poetry
111 | #   Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
112 | #   This is especially recommended for binary packages to ensure reproducibility, and is more
113 | #   commonly ignored for libraries.
114 | #   https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
115 | #poetry.lock
116 | 
117 | # pdm
118 | #   Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
119 | #pdm.lock
120 | #   pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
121 | #   in version control.
122 | #   https://pdm.fming.dev/#use-with-ide
123 | .pdm.toml
124 | 
125 | # PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
126 | __pypackages__/
127 | 
128 | # Celery stuff
129 | celerybeat-schedule
130 | celerybeat.pid
131 | 
132 | # SageMath parsed files
133 | *.sage.py
134 | 
135 | # Environments
136 | .env
137 | .venv
138 | env/
139 | venv/
140 | ENV/
141 | env.bak/
142 | venv.bak/
143 | 
144 | # Spyder project settings
145 | .spyderproject
146 | .spyproject
147 | 
148 | # Rope project settings
149 | .ropeproject
150 | 
151 | # mkdocs documentation
152 | /site
153 | 
154 | # mypy
155 | .mypy_cache/
156 | .dmypy.json
157 | dmypy.json
158 | 
159 | # Pyre type checker
160 | .pyre/
161 | 
162 | # pytype static type analyzer
163 | .pytype/
164 | 
165 | # Cython debug symbols
166 | cython_debug/
167 | 
168 | # PyCharm
169 | #  JetBrains specific template is maintained in a separate JetBrains.gitignore that can
170 | #  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
171 | #  and can be added to the global gitignore or merged into this file.  For a more nuclear
172 | #  option (not recommended) you can uncomment the following to ignore the entire idea folder.
173 | #.idea/
174 | 
175 | ### Python Patch ###
176 | # Poetry local configuration file - https://python-poetry.org/docs/configuration/#local-configuration
177 | poetry.toml
178 | 
179 | # ruff
180 | .ruff_cache/
181 | 
182 | # LSP config files
183 | pyrightconfig.json
184 | 
185 | # End of https://www.toptal.com/developers/gitignore/api/python
186 | chainforge_assets/
187 | .vscode/
188 | 


--------------------------------------------------------------------------------
/Dockerfile:
--------------------------------------------------------------------------------
# Image that installs the published `chainforge` package with pip and runs its server.
FROM python:3.12-slim AS builder

# Upgrade pip first, then install chainforge without keeping pip's download cache.
RUN pip install --upgrade pip
RUN pip install chainforge --no-cache-dir

WORKDIR /chainforge

# 8000 is the default port of `chainforge serve`.
EXPOSE 8000
# Override the default 'localhost' host with 0.0.0.0 so the server listens on all interfaces.
ENTRYPOINT [ "chainforge", "serve", "--host", "0.0.0.0" ]
10 | 


--------------------------------------------------------------------------------
/LICENSE.md:
--------------------------------------------------------------------------------
 1 | MIT License
 2 | 
 3 | Copyright (c) 2023 Ian Arawjo
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | of this software and associated documentation files (the "Software"), to deal
 7 | in the Software without restriction, including without limitation the rights
 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 | 
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 | 
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/MANIFEST.in:
--------------------------------------------------------------------------------
1 | graft chainforge/react-server/build
2 | graft chainforge/examples
3 | include README.md


--------------------------------------------------------------------------------
/chainforge/__init__.py:
--------------------------------------------------------------------------------
1 | from .app import main
2 | 


--------------------------------------------------------------------------------
/chainforge/app.py:
--------------------------------------------------------------------------------
 1 | import argparse
 2 | from chainforge.flask_app import run_server
 3 | import textwrap
 4 | 
 5 | # Main Chainforge start
 6 | def main():
 7 |     parser = argparse.ArgumentParser(description='Chainforge command line tool')
 8 | 
 9 |     # Serve command
10 |     subparsers = parser.add_subparsers(dest='serve')
11 |     serve_parser = subparsers.add_parser('serve', help='Start Chainforge server', formatter_class=argparse.RawTextHelpFormatter)
12 | 
13 |     # TODO: Add this back
14 |     # Turn on to disable all outbound LLM API calls and replace them with dummy calls
15 |     # that return random strings of ASCII characters. Useful for testing interface without wasting $$.
16 |     # serve_parser.add_argument('--dummy-responses', 
17 |     #     help="""Disables queries to LLMs, replacing them with spoofed responses composed of random ASCII characters. 
18 |     #             Produces each dummy response at random intervals between 0.1 and 3 seconds.""", 
19 |     #     dest='dummy_responses', 
20 |     #     action='store_true')
21 |     
22 |     # TODO: Reimplement this where the React server is given the backend's port before loading.
23 |     serve_parser.add_argument('--port', 
24 |                               help='The port to run the server on. Defaults to 8000.', 
25 |                               type=int, default=8000, nargs='?')
26 |     serve_parser.add_argument('--host', 
27 |                               help="The host to run the server on. Defaults to 'localhost'.", 
28 |                               type=str, default="localhost", nargs='?')
29 |     serve_parser.add_argument('--dir',
30 |                               help=textwrap.dedent("""\
31 |                                 Set a custom directory to use for saving flows and autosaving.
32 |                                 By default, ChainForge uses the user data location suggested by the `platformdirs` module.
33 |                                 Should be an absolute path."""),
34 |                               type=str,
35 |                               default=None)
36 |     serve_parser.add_argument('--secure', 
37 |                               choices=["off", "settings", "all"],
38 |                               default="off",
39 |                               help=textwrap.dedent("""\
40 |                                 Encrypts locally stored files with a password. 
41 |                                 Encryption modes are:
42 |                                     - off      = no encryption (default)
43 |                                     - settings = only encrypt the settings file (that may contain API keys entered via the UI)
44 |                                     - all      = encrypt all files (flows, settings, favorites, etc)
45 |                                 You must provide a password at every startup.
46 |                                 Ensure that you save your password somewhere, as it is not stored anywhere.
47 |                                 If you lose it, you will not be able to access your files. 
48 |                                 NOTE: Clicking the 'Export' button in the UI will still export a non-encrypted flow, in case you need to share the file in the normal manner. 
49 |                                 This setting is only for local storage.""")
50 |                                )
51 | 
52 |     args = parser.parse_args()
53 | 
54 |     # Currently only support the 'serve' command...
55 |     if not args.serve:
56 |         parser.print_help()
57 |         exit(0)
58 | 
59 |     port = args.port if args.port else 8000
60 |     host = args.host if args.host else "localhost"
61 | 
62 |     if args.dir:
63 |         print(f"Using directory for storing flows: {args.dir}")
64 | 
65 |     print(f"Serving Flask server on {host} on port {port}...")
66 |     run_server(host=host, port=port, flows_dir=args.dir, secure=args.secure)
67 | 
68 | if __name__ == "__main__":
69 |     main()


--------------------------------------------------------------------------------
/chainforge/examples/custom_provider_cohere.py:
--------------------------------------------------------------------------------
 1 | """
 2 |     A simple custom model provider to add to the ChainForge interface,
 3 |     to support Cohere AI text completions through their Python API.
 4 | 
 5 |     NOTE: You must have the `cohere` package installed and an API key.
 6 | """
 7 | from chainforge.providers import provider
 8 | import cohere
 9 | 
# Init the Cohere client (replace '<YOUR_API_KEY>' with your Cohere API key).
# The client is created once, when this module is loaded.
co = cohere.Client('<YOUR_API_KEY>')
12 | 
# JSON schemas to pass to react-jsonschema-form: "settings" describes this
# endpoint's settings and "ui" describes how the settings UI renders them.
# The "ui:help" texts must stay in sync with the "default" values above them.
COHERE_SETTINGS_SCHEMA = {
  "settings": {
    "temperature": {
      "type": "number",
      "title": "temperature",
      "description": "Controls the 'creativity' or randomness of the response.",
      "default": 0.75,
      "minimum": 0,
      "maximum": 5.0,
      "multipleOf": 0.01,
    },
    "max_tokens": {
      "type": "integer",
      "title": "max_tokens",
      "description": "Maximum number of tokens to generate in the response.",
      "default": 100,
      "minimum": 1,
      "maximum": 1024,
    },
  },
  "ui": {
    "temperature": {
      "ui:help": "Defaults to 0.75.",
      "ui:widget": "range"
    },
    "max_tokens": {
      "ui:help": "Defaults to 100.",
      "ui:widget": "range"
    },
  }
}
45 | 
# Custom ChainForge model provider wrapping Cohere's text generation API.
@provider(
    name="Cohere",
    emoji="🖇",
    models=['command', 'command-nightly', 'command-light', 'command-light-nightly'],
    # "sequential" makes requests blocking; an integer N > 0 means N is the
    # max number of requests per minute.
    rate_limit="sequential",
    settings_schema=COHERE_SETTINGS_SCHEMA,
)
def CohereCompletion(prompt: str, model: str, temperature: float = 0.75, **kwargs) -> str:
    """Send `prompt` to a Cohere model and return the generated text.

    Args:
        prompt: The text prompt to complete.
        model: Name of the Cohere model to call.
        temperature: Sampling temperature forwarded to Cohere.
        **kwargs: Any further keyword arguments, forwarded unchanged to
            `co.generate` (presumably other settings from the schema, such
            as `max_tokens` -- verify against the caller).

    Returns:
        The text of the first generation in Cohere's response.
    """
    print(f"Calling Cohere model {model} with prompt '{prompt}'...")
    completion = co.generate(
        model=model,
        prompt=prompt,
        temperature=temperature,
        **kwargs,
    )
    first_generation = completion.generations[0]
    return first_generation.text
56 | 


--------------------------------------------------------------------------------
/chainforge/oaievals/README.md:
--------------------------------------------------------------------------------
 1 | # Preconverted OpenAI evals
 2 | 
 3 | The ChainForge flows in this directory were derived from a subset of OpenAI's evals registry: https://github.com/openai/evals
 4 | These files are _not_ included in the PyPI chainforge package, but rather fetched from GitHub on an as-needed basis.
 5 | This is to avoid requiring users to install OpenAI evals (which requires Git LFS, Python 3.9+, and a large number of dependencies).
 6 | 
 7 | OpenAI evals is under the MIT License:
 8 | 
 9 | MIT License
10 | 
11 | Copyright (c) 2023 OpenAI
12 | 
13 | Permission is hereby granted, free of charge, to any person obtaining a copy
14 | of this software and associated documentation files (the "Software"), to deal
15 | in the Software without restriction, including without limitation the rights
16 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
17 | copies of the Software, and to permit persons to whom the Software is
18 | furnished to do so, subject to the following conditions:
19 | 
20 | The above copyright notice and this permission notice shall be included in all
21 | copies or substantial portions of the Software.
22 | 
23 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
24 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
25 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
26 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
27 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
28 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
29 | SOFTWARE.


--------------------------------------------------------------------------------
/chainforge/oaievals/adultery_state_laws.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-adultery_state_laws", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "You are an assistant with knowledge of U.S. state laws. Answer the questions accurately.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "You are an assistant with knowledge of U.S. state laws. Answer the questions accurately.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-adultery_state_laws", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideal = response.meta['Ideal'];\n\treturn response.text.startsWith(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-adultery_state_laws", "type": "vis", "data": {"input": "eval-adultery_state_laws"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-adultery_state_laws", "type": "inspect", "data": {"input": "prompt-adultery_state_laws"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-adultery_state_laws", "type": "table", "data": {"rows": [{"prompt": "List the states where adultery is technically illegal. 
Only provide a list of states with no explanation.", "ideal": "Alabama, Arizona, Florida, Idaho, Illinois, Kansas, Michigan, Minnesota, Mississippi, New York, North Carolina, Oklahoma, Rhode Island, South Carolina, Virginia, Wisconsin, Georgia"}, {"prompt": "Is adultery illegal in Alabama?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in Arizona?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in Florida?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in Georgia?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in Idaho?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in Illinois?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in Kansas?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in Michigan?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in Minnesota?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in Mississippi?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in New York?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in North Carolina?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in Oklahoma?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in Rhode Island?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in South Carolina?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in Virginia?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in Wisconsin?", "ideal": "Yes"}, {"prompt": "Is adultery illegal in Alaska?", "ideal": "No"}, {"prompt": "List the states where adultery is illegal again. How was your list different now?", "ideal": "Alabama, Arizona, Florida, Idaho, Illinois, Kansas, Michigan, Minnesota, Mississippi, New York, North Carolina, Oklahoma, Rhode Island, South Carolina, Virginia, Wisconsin, Georgia. 
The list remains the same."}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-adultery_state_laws", "sourceHandle": "prompt", "target": "eval-adultery_state_laws", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-adultery_state_laws", "sourceHandle": "prompt", "target": "inspect-adultery_state_laws", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-adultery_state_laws", "sourceHandle": "output", "target": "vis-adultery_state_laws", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-adultery_state_laws", "sourceHandle": "Prompt", "target": "prompt-adultery_state_laws", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/algebra-word-problems.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-algebra-word-problems", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "Answer the following question with a single number and no additional text. You are a helpful assistant.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "Answer the following question with a single number and no additional text. You are a helpful assistant.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-algebra-word-problems", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideal = response.meta['Ideal'];\n\treturn response.text.startsWith(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-algebra-word-problems", "type": "vis", "data": {"input": "eval-algebra-word-problems"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-algebra-word-problems", "type": "inspect", "data": {"input": "prompt-algebra-word-problems"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-algebra-word-problems", "type": "table", "data": {"rows": [{"prompt": "If it takes 5 machines 5 minutes to make 5 devices, how long would it take 100 machines to make 100 devices?", "ideal": "5"}, 
{"prompt": "What is the sum of 60000, 5000, 400, and 3, with the third value multiplied by 5 before performing the operation?", "ideal": "67003"}, {"prompt": "If the sum of the smallest and largest of three consecutive even numbers is 28, what is the value of the second largest number in the series?", "ideal": "14"}, {"prompt": "John is trying to fill a 16 oz. bottle with water. If John fills the bottle at 1 oz per second and the bottle leaks .2 oz per second, how long would it take for John to fill the bottle?", "ideal": "20"}, {"prompt": "Annie is training for a marathon. She has a weekly training routine, training for five hours a day on some days and 3 hours a day on the other days. She trains a total of 27 hours in a seven day week. On how many days does she train for five hours?", "ideal": "3"}, {"prompt": "At the start of the year the ratio of boys to girls in a class is 2 : 1. But now, half a year later, four boys have left the class and there are two new girls. The ratio of boys to girls is now 4 : 3. 
How many students are there altogether now?", "ideal": "28"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-algebra-word-problems", "sourceHandle": "prompt", "target": "eval-algebra-word-problems", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-algebra-word-problems", "sourceHandle": "prompt", "target": "inspect-algebra-word-problems", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-algebra-word-problems", "sourceHandle": "output", "target": "vis-algebra-word-problems", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-algebra-word-problems", "sourceHandle": "Prompt", "target": "prompt-algebra-word-problems", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/counterfactual-reasoning.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-counterfactual-reasoning", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "You are a helpful assistant.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "You are a helpful assistant.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-counterfactual-reasoning", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet txt = response.text;\n\tlet ideal = response.meta['Ideal'];\n\treturn ideal.includes(txt) || txt.includes(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-counterfactual-reasoning", "type": "vis", "data": {"input": "eval-counterfactual-reasoning"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-counterfactual-reasoning", "type": "inspect", "data": {"input": "prompt-counterfactual-reasoning"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-counterfactual-reasoning", "type": "table", "data": {"rows": [{"prompt": "If the sky flies in a bird, then what does the ground run on?", "ideal": "human"}, {"prompt": "If a song sings a bird, then what does a book read?", "ideal": "human"}, {"prompt": "If the river swims in a fish, then 
what does a bone chew?", "ideal": "dog"}, {"prompt": "If the earth flows on the river, then what does the sky hangs in?", "ideal": "the sun"}, {"prompt": "If the windmill blows the wind, then what does the grass moisten?", "ideal": "the rain"}, {"prompt": "If the lock unlocks the key, then what does the sheath go in?", "ideal": "the knife or the sword"}, {"prompt": "If the moon means the day, then what does the sun means?", "ideal": "the night"}, {"prompt": "If the black color means bad things, then what does the white color means?", "ideal": "good things"}, {"prompt": "If the black color means a low position, then what does the white color means?", "ideal": "a high position"}, {"prompt": "If the ice feels hot, then what does the fire feel?", "ideal": "cold"}, {"prompt": "If the moon is bigger than the earth, then who is bigger between the earth and the sun?", "ideal": "the earth"}, {"prompt": "If the moon is a cubic object, then what is the shape of the sun?", "ideal": "cube"}, {"prompt": "If chinese food matches Beijing, then what does american food match?", "ideal": "washington"}, {"prompt": "If 1 is less than 2, then is 3 bigger than 4?", "ideal": "yes"}, {"prompt": "If one matches eno, then what does two match?", "ideal": "owt"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-counterfactual-reasoning", "sourceHandle": "prompt", "target": "eval-counterfactual-reasoning", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-counterfactual-reasoning", "sourceHandle": "prompt", "target": "inspect-counterfactual-reasoning", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", 
"width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-counterfactual-reasoning", "sourceHandle": "output", "target": "vis-counterfactual-reasoning", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-counterfactual-reasoning", "sourceHandle": "Prompt", "target": "prompt-counterfactual-reasoning", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/crontab.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-crontab", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "Generate a cron expression with 5 fields from the given description. Output the cron expression ONLY and make your answer as short as possible.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "Generate a cron expression with 5 fields from the given description. Output the cron expression ONLY and make your answer as short as possible.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-crontab", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideal = response.meta['Ideal'];\n\treturn response.text.startsWith(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-crontab", "type": "vis", "data": {"input": "eval-crontab"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-crontab", "type": "inspect", "data": {"input": "prompt-crontab"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-crontab", "type": "table", "data": {"rows": [{"prompt": "At 04:05.", "ideal": "5 4 * * *"}, {"prompt": "At 00:05 in August.", "ideal": "5 0 * 8 *"}, {"prompt": "At 14:15 on day-of-month 1.", "ideal": 
"15 14 1 * *"}, {"prompt": "At 22:00 on every day-of-week from Monday through Friday.", "ideal": "0 22 * * 1-5"}, {"prompt": "At minute 23 past every 2nd hour from 0 through 20.", "ideal": "23 0-20/2 * * *"}, {"prompt": "At minute 0 past hour 0 and 12 on day-of-month 1 in every 2nd month.", "ideal": "0 0,12 1 */2 *"}, {"prompt": "At 04:00 on every day-of-month from 8 through 14.", "ideal": "0 4 8-14 * *"}, {"prompt": "At 00:00 on day-of-month 1 and 15 and on Wednesday.", "ideal": "0 0 1,15 * 3"}, {"prompt": "At 04:05 on Sunday.", "ideal": "5 4 * * 0"}, {"prompt": "At every minute.", "ideal": "* * * * *"}, {"prompt": "At every 2nd minute.", "ideal": "*/2 * * * *"}, {"prompt": "At every 2nd minute from 1 through 59.", "ideal": "1-59/2 * * * *"}, {"prompt": "At every 3rd minute.", "ideal": "*/3 * * * *"}, {"prompt": "At every 4th minute.", "ideal": "*/4 * * * *"}, {"prompt": "At every 5th minute.", "ideal": "*/5 * * * *"}, {"prompt": "At minute 30.", "ideal": "30 * * * *"}, {"prompt": "At every 30th minute.", "ideal": "*/30 * * * *"}, {"prompt": "At 00:00 on day-of-month 1 in January.", "ideal": "0 0 1 1 *"}, {"prompt": "At 00:00 on day-of-month 1 in every 6th month.", "ideal": "0 0 1 */6 *"}, {"prompt": "At 00:00 on Saturday and Sunday.", "ideal": "0 0 * * 6,0"}, {"prompt": "At 00:00 on day-of-month 1 in every 3rd month.", "ideal": "0 0 1 */3 *"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-crontab", "sourceHandle": "prompt", "target": "eval-crontab", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-crontab", "sourceHandle": "prompt", "target": "inspect-crontab", "targetHandle": "input", 
"interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-crontab", "sourceHandle": "output", "target": "vis-crontab", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-crontab", "sourceHandle": "Prompt", "target": "prompt-crontab", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/finnish-rhyme.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-finnish-rhyme", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "For each pair of words, determine whether their Finnish translations rhyme. If they do, output the pair of rhyming words in Finnish. If not, output NONE.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "For each pair of words, determine whether their Finnish translations rhyme. If they do, output the pair of rhyming words in Finnish. If not, output NONE.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-finnish-rhyme", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet txt = response.text;\n\tlet ideal = response.meta['Ideal'];\n\treturn ideal.includes(txt) || txt.includes(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-finnish-rhyme", "type": "vis", "data": {"input": "eval-finnish-rhyme"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-finnish-rhyme", "type": "inspect", "data": {"input": "prompt-finnish-rhyme"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-finnish-rhyme", "type": "table", "data": {"rows": [{"prompt": "boat, Go!", "ideal": "vene, Mene!"}, 
{"prompt": "snow, rubber", "ideal": "lumi, kumi"}, {"prompt": "car, tasteless", "ideal": "NONE"}, {"prompt": "flower, sock", "ideal": "kukka, sukka"}, {"prompt": "carpet, motto", "ideal": "NONE"}, {"prompt": "moth, butter", "ideal": "koi, voi"}, {"prompt": "ass (animal), glass", "ideal": "NONE"}, {"prompt": "meringue, spirit", "ideal": "marenki, henki"}, {"prompt": "marble, basket", "ideal": "marmori, kori"}, {"prompt": "sea, blood", "ideal": "meri, veri"}, {"prompt": "sea, pal", "ideal": "meri, kaveri"}, {"prompt": "wall, hay", "ideal": "sein\u00e4, hein\u00e4"}, {"prompt": "bottle, ball", "ideal": "NONE"}, {"prompt": "human being, delicious", "ideal": "ihminen, herkullinen"}, {"prompt": "pill, blood", "ideal": "pilleri, veri"}, {"prompt": "book, Norway", "ideal": "NONE"}, {"prompt": "slave, Norway", "ideal": "orja, Norja"}, {"prompt": "climate, mast", "ideal": "ilmasto, masto"}, {"prompt": "room, machine", "ideal": "NONE"}, {"prompt": "sabbath, watt", "ideal": "sapatti, watti"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-finnish-rhyme", "sourceHandle": "prompt", "target": "eval-finnish-rhyme", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-finnish-rhyme", "sourceHandle": "prompt", "target": "inspect-finnish-rhyme", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-finnish-rhyme", "sourceHandle": "output", "target": "vis-finnish-rhyme", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", 
"height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-finnish-rhyme", "sourceHandle": "Prompt", "target": "prompt-finnish-rhyme", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/historical-kana-orthography-reading.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-historical-kana-orthography-reading", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "Answer the reading of the word in historical kana orthography with modern kana orthography. Only use hiragana. Do not output any other output at all. If the input is the answer itself, please answer as is.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "Answer the reading of the word in historical kana orthography with modern kana orthography. Only use hiragana. Do not output any other output at all. If the input is the answer itself, please answer as is.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-historical-kana-orthography-reading", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideal = response.meta['Ideal'];\n\treturn response.text.startsWith(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-historical-kana-orthography-reading", "type": "vis", "data": {"input": "eval-historical-kana-orthography-reading"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-historical-kana-orthography-reading", "type": "inspect", "data": {"input": "prompt-historical-kana-orthography-reading"}, "position": {"x": 820, "y": 
400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-historical-kana-orthography-reading", "type": "table", "data": {"rows": [{"prompt": "\u304a\u307b\u3057", "ideal": "\u304a\u304a\u3057"}, {"prompt": "\u3042\u3046\u3080", "ideal": "\u304a\u3046\u3080"}, {"prompt": "\u3044\u3046\u306a\u308a", "ideal": "\u3086\u3046\u306a\u308a"}, {"prompt": "\u3048\u3046\u3058", "ideal": "\u3088\u3046\u3058"}, {"prompt": "\u3046\u3064\u304f\u3057\u3046", "ideal": "\u3046\u3064\u304f\u3057\u3085\u3046"}, {"prompt": "\u3044\u3066\u3075", "ideal": "\u3044\u3061\u3087\u3046"}, {"prompt": "\u304f\u308f\u304b\u304f", "ideal": "\u304b\u304b\u304f"}, {"prompt": "\u305b\u3046\u3058\u3093", "ideal": "\u3057\u3087\u3046\u3058\u3093"}, {"prompt": "\u3072\u3080\u304c\u3057", "ideal": "\u3072\u3093\u304c\u3057"}, {"prompt": "\u304f\u308f\u3057", "ideal": "\u304b\u3057"}, {"prompt": "\u3042\u306f\u308c", "ideal": "\u3042\u308f\u308c"}, {"prompt": "\u3091\u3073\u3059", "ideal": "\u3048\u3073\u3059"}, {"prompt": "\u3067\u305b\u3046", "ideal": "\u3067\u3057\u3087\u3046"}, {"prompt": "\u304b\u306f", "ideal": "\u304b\u308f"}, {"prompt": "\u3090\u306a\u304b", "ideal": "\u3044\u306a\u304b"}, {"prompt": "\u3092\u3068\u3053", "ideal": "\u304a\u3068\u3053"}, {"prompt": "\u3066\u3046\u3065", "ideal": "\u3061\u3087\u3046\u305a"}, {"prompt": "\u3082\u3093\u3050\u308f\u3044", "ideal": "\u3082\u3093\u304c\u3044"}, {"prompt": "\u3042\u3075\u304e", "ideal": "\u304a\u3046\u304e"}, {"prompt": "\u3042\u3072\u3065\u3061", "ideal": "\u3042\u3044\u3065\u3061"}, {"prompt": "\u306b\u3064\u304d", "ideal": "\u306b\u3063\u304d"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-historical-kana-orthography-reading", "sourceHandle": "prompt", "target": "eval-historical-kana-orthography-reading", 
"targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-historical-kana-orthography-reading", "sourceHandle": "prompt", "target": "inspect-historical-kana-orthography-reading", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-historical-kana-orthography-reading", "sourceHandle": "output", "target": "vis-historical-kana-orthography-reading", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-historical-kana-orthography-reading", "sourceHandle": "Prompt", "target": "prompt-historical-kana-orthography-reading", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/multi-step-equations.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-multi-step-equations", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "Solve the following question for x. Answer with a single number and no additional text. You are a helpful assistant.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "Solve the following question for x. Answer with a single number and no additional text. You are a helpful assistant.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-multi-step-equations", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideal = response.meta['Ideal'];\n\treturn response.text.startsWith(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-multi-step-equations", "type": "vis", "data": {"input": "eval-multi-step-equations"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-multi-step-equations", "type": "inspect", "data": {"input": "prompt-multi-step-equations"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-multi-step-equations", "type": "table", "data": {"rows": [{"prompt": "8x + 4x = 12", "ideal": "1"}, {"prompt": "-5x - 3x = 16", "ideal": "-2"}, {"prompt": "2x + 4 + 5 = 13", 
"ideal": "2"}, {"prompt": "-7x - 2x = 0", "ideal": "0"}, {"prompt": "8x + 8 = 8", "ideal": "0"}, {"prompt": "40 = 10x + 10x", "ideal": "2"}, {"prompt": "-15 = \u22122x + 5x", "ideal": "-5"}, {"prompt": "\u221210 = 4(1 + 4x) \u2212 2x", "ideal": "-1"}, {"prompt": "5(\u2212x + 5) = 15", "ideal": "2"}, {"prompt": "\u22122x \u2212 4(1 + 8x) = \u2212174", "ideal": "5"}, {"prompt": "\u22122(4x \u2212 2) = \u22122(2 + 3x)", "ideal": "4"}, {"prompt": "2x \u2212 4(1 + 2x) = \u221224 + 4x", "ideal": "2"}, {"prompt": "\u22122(\u22122x \u2212 4) = \u22124x + 184", "ideal": "22"}, {"prompt": "\u221210 \u2212 5x = 2(5x - 20)", "ideal": "2"}, {"prompt": "\u22122(6x \u2212 2) = \u22122(3 + 5x)", "ideal": "5"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-multi-step-equations", "sourceHandle": "prompt", "target": "eval-multi-step-equations", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-multi-step-equations", "sourceHandle": "prompt", "target": "inspect-multi-step-equations", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-multi-step-equations", "sourceHandle": "output", "target": "vis-multi-step-equations", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-multi-step-equations", "sourceHandle": "Prompt", "target": "prompt-multi-step-equations", "targetHandle": "prompt", "interactionWidth": 100, 
"markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/nepali-song-singer.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-nepali-song-singer", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "A user will give you a English transliteration phrase of Nepali song. Give the name of the singer or band.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "A user will give you a English transliteration phrase of Nepali song. Give the name of the singer or band.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-nepali-song-singer", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideal = response.meta['Ideal'];\n\treturn response.text.includes(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-nepali-song-singer", "type": "vis", "data": {"input": "eval-nepali-song-singer"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-nepali-song-singer", "type": "inspect", "data": {"input": "prompt-nepali-song-singer"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-nepali-song-singer", "type": "table", "data": {"rows": [{"prompt": "Yo maan ta mero nepali ho", "ideal": "1974 AD"}, {"prompt": "Timro maya le badhera rakha", "ideal": "Ashmita Adhikari"}, {"prompt": "Euta 
manchhe ko maya le", "ideal": "Narayan Gopal"}, {"prompt": "Kehi mitho baata gara", "ideal": "Narayan Gopal"}, {"prompt": "Mohani Lagla Hai", "ideal": "Narayan Gopal"}, {"prompt": "Biratako Chino", "ideal": "Narayan Gopal"}, {"prompt": "Baneko chha Paharale", "ideal": "Gopal Yonjan"}, {"prompt": "Siran ma photo cha", "ideal": "Nepathya"}, {"prompt": "Bheda ko oon jasto", "ideal": "Nepathya"}, {"prompt": "Thula thula mahal", "ideal": "Karna Das"}, {"prompt": "Anautho betha", "ideal": "Karna Das"}, {"prompt": "Ma Kahile Haseko Thiye", "ideal": "Yash Kumar"}, {"prompt": "Sanjha Pakha", "ideal": "Nabin K Bhattarai"}, {"prompt": "Yehi ho ta maya", "ideal": "Nabin K Bhattarai"}, {"prompt": "Ekanta chha thau", "ideal": "COD"}, {"prompt": "Yo Prasanga", "ideal": "Yama Buddha"}, {"prompt": "Orali lageko", "ideal": "Ram Krishna Dhakal"}, {"prompt": "Malai Yo Zindagi Le", "ideal": "Ram Krishna Dhakal"}, {"prompt": "Pheri Tyo Din", "ideal": "Sugam Pokhrel"}, {"prompt": "Dashain Tihar", "ideal": "Sugam Pokhrel"}, {"prompt": "Samhalincha Kahile Maan", "ideal": "Sugam Pokhrel"}, {"prompt": "Ma ta dur dekhi", "ideal": "Deep Shrestha"}, {"prompt": "Badal haru", "ideal": "Deep Shrestha"}, {"prompt": "Halla Chalechha", "ideal": "Raju Lama"}, {"prompt": "Sayad Timro Bato Ma", "ideal": "Raju Lama"}, {"prompt": "Timi Lai Dekhera", "ideal": "Raju Lama"}, {"prompt": "Aaja maan udhera bhagchha", "ideal": "Udit Narayan"}, {"prompt": "Kaha Hola Ghar Bara", "ideal": "Karma"}, {"prompt": "Ko hau timi", "ideal": "Karma"}, {"prompt": "Khaseka Tara", "ideal": "Albatross"}, {"prompt": "Timi Bhane", "ideal": "Albatross"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-nepali-song-singer", "sourceHandle": "prompt", "target": "eval-nepali-song-singer", "targetHandle": "responseBatch", "interactionWidth": 100, 
"markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-nepali-song-singer", "sourceHandle": "prompt", "target": "inspect-nepali-song-singer", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-nepali-song-singer", "sourceHandle": "output", "target": "vis-nepali-song-singer", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-nepali-song-singer", "sourceHandle": "Prompt", "target": "prompt-nepali-song-singer", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/passing-balls.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-passing-balls", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "Imagine there are three players: player 1, 2, and 3. The players are passing a ball around. For a given starting player and passing sequence, determine the last player holding the ball. Output only the number of the player. Do not explain your reasoning.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "Imagine there are three players: player 1, 2, and 3. The players are passing a ball around. For a given starting player and passing sequence, determine the last player holding the ball. Output only the number of the player. 
Do not explain your reasoning.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-passing-balls", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet txt = response.text;\n\tlet ideal = response.meta['Ideal'];\n\treturn ideal.includes(txt) || txt.includes(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-passing-balls", "type": "vis", "data": {"input": "eval-passing-balls"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-passing-balls", "type": "inspect", "data": {"input": "prompt-passing-balls"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-passing-balls", "type": "table", "data": {"rows": [{"prompt": "Starting player: 1. Passing sequence: 2", "ideal": "2"}, {"prompt": "Starting player: 1. Passing sequence: 23", "ideal": "3"}, {"prompt": "Starting player: 1. Passing sequence: 232", "ideal": "2"}, {"prompt": "Starting player: 1. Passing sequence: 2321", "ideal": "1"}, {"prompt": "Starting player: 1. Passing sequence: 23212", "ideal": "2"}, {"prompt": "Starting player: 1. Passing sequence: 232123", "ideal": "3"}, {"prompt": "Starting player: 1. Passing sequence: 231232", "ideal": "2"}, {"prompt": "Starting player: 1. Passing sequence: 2312321", "ideal": "1"}, {"prompt": "Starting player: 1. Passing sequence: 23123212", "ideal": "2"}, {"prompt": "Starting player: 1. Passing sequence: 231232123", "ideal": "3"}, {"prompt": "Starting player: 1. Passing sequence: 23123", "ideal": "3"}, {"prompt": "Starting player: 1. 
Passing sequence: 23123123", "ideal": "3"}, {"prompt": "Starting player: 1. Passing sequence: 23123123123", "ideal": "3"}, {"prompt": "Starting player: 1. Passing sequence: 23123123123123", "ideal": "3"}, {"prompt": "Starting player: 1. Passing sequence: 21231323121321", "ideal": "1"}, {"prompt": "Starting player: 1. Passing sequence: 23231323121312", "ideal": "2"}, {"prompt": "Starting player: 1. Passing sequence: 23123232132313", "ideal": "3"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-passing-balls", "sourceHandle": "prompt", "target": "eval-passing-balls", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-passing-balls", "sourceHandle": "prompt", "target": "inspect-passing-balls", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-passing-balls", "sourceHandle": "output", "target": "vis-passing-balls", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-passing-balls", "sourceHandle": "Prompt", "target": "prompt-passing-balls", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, 
"table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/polish-syllable-count.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-polish-syllable-count", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "Trzeba policzy\u0107 sylaby w polskim wyrazie i odpowiedzie\u0107 tylko jedn\u0105 cyfr\u0105. Wpisz tylko numer i nic wi\u0119cej.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "Trzeba policzy\u0107 sylaby w polskim wyrazie i odpowiedzie\u0107 tylko jedn\u0105 cyfr\u0105. Wpisz tylko numer i nic wi\u0119cej.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-polish-syllable-count", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideal = response.meta['Ideal'];\n\treturn response.text.startsWith(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-polish-syllable-count", "type": "vis", "data": {"input": "eval-polish-syllable-count"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-polish-syllable-count", "type": "inspect", "data": {"input": "prompt-polish-syllable-count"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-polish-syllable-count", "type": "table", "data": {"rows": [{"prompt": "Wyraz: miasto", "ideal": "2"}, {"prompt": "Wyraz: cieszy\u0107", 
"ideal": "2"}, {"prompt": "Wyraz: kwiatek", "ideal": "2"}, {"prompt": "Wyraz: piosenkarka", "ideal": "4"}, {"prompt": "Wyraz: dziewanna", "ideal": "3"}, {"prompt": "Wyraz: niedowiarek", "ideal": "4"}, {"prompt": "Wyraz: nienormalny", "ideal": "4"}, {"prompt": "Wyraz: zmia\u017cd\u017cy\u0107", "ideal": "2"}, {"prompt": "Wyraz: cierpienie", "ideal": "3"}, {"prompt": "Wyraz: Paulina", "ideal": "3"}, {"prompt": "Wyraz: przyja\u017a\u0144", "ideal": "2"}, {"prompt": "Wyraz: chrz\u0105szcz", "ideal": "1"}, {"prompt": "Wyraz: wszystkich", "ideal": "2"}, {"prompt": "Wyraz: wi\u0119kszo\u015b\u0107", "ideal": "2"}, {"prompt": "Wyraz: ciecierzycy", "ideal": "4"}, {"prompt": "Wyraz: fiord", "ideal": "1"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-polish-syllable-count", "sourceHandle": "prompt", "target": "eval-polish-syllable-count", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-polish-syllable-count", "sourceHandle": "prompt", "target": "inspect-polish-syllable-count", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-polish-syllable-count", "sourceHandle": "output", "target": "vis-polish-syllable-count", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-polish-syllable-count", "sourceHandle": "Prompt", "target": "prompt-polish-syllable-count", "targetHandle": "prompt", 
"interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/reverse-polish-notation.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-reverse-polish-notation", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "Convert mathematical expression to reverse polish notation. Do not provide any explanation or commentary, output the result only.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "Convert mathematical expression to reverse polish notation. Do not provide any explanation or commentary, output the result only.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-reverse-polish-notation", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideal = response.meta['Ideal'];\n\treturn response.text.startsWith(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-reverse-polish-notation", "type": "vis", "data": {"input": "eval-reverse-polish-notation"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-reverse-polish-notation", "type": "inspect", "data": {"input": "prompt-reverse-polish-notation"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-reverse-polish-notation", "type": "table", "data": {"rows": [{"prompt": "Mathematical expression: 1 + 1", "ideal": "1 1 +"}, 
{"prompt": "Mathematical expression: 2 * 4 + 8", "ideal": "2 4 * 8 +"}, {"prompt": "Mathematical expression: 2 * (4 + 8)", "ideal": "2 4 8 + *"}, {"prompt": "Mathematical expression: (1 + 2) * (3 * 4)", "ideal": "1 2 + 3 4 * *"}, {"prompt": "Mathematical expression: 1 + (2 - (3 + 4))", "ideal": "1 2 - 3 4 + +"}, {"prompt": "Mathematical expression: (3 + 5) * (7 - 2)", "ideal": "3 5 + 7 2 - *"}, {"prompt": "Mathematical expression: (1 + 2) * 4", "ideal": "1 2 + 4 *"}, {"prompt": "Mathematical expression: 0", "ideal": "0"}, {"prompt": "Mathematical expression: (1 + 2) * 5 + 7", "ideal": "1 2 + 5 * 7 +"}, {"prompt": "Mathematical expression: (10 + 6) * 3", "ideal": "10 6 + 3 *"}, {"prompt": "Mathematical expression: (2 / 8) * (5 - 6)", "ideal": "2 8 / 5 6 - *"}, {"prompt": "Mathematical expression: (x + y) * z", "ideal": "x y + z *"}, {"prompt": "Mathematical expression: 5 / (5 + y * x)", "ideal": "5 5 y x * + /"}, {"prompt": "Mathematical expression: 4 + (13 / 5)", "ideal": "4 13 5 / +"}, {"prompt": "Mathematical expression: 2^3", "ideal": "2 3 ^"}, {"prompt": "Mathematical expression: (3 + x * 8) / (1 + 3 * x)", "ideal": "3 x 8 * + 1 3 x * + /"}, {"prompt": "Mathematical expression: (y * 5 + 1) / (3 * x + 1)", "ideal": "y 5 * 1 + 3 x * 1 + /"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-reverse-polish-notation", "sourceHandle": "prompt", "target": "eval-reverse-polish-notation", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-reverse-polish-notation", "sourceHandle": "prompt", "target": "inspect-reverse-polish-notation", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": 
"arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-reverse-polish-notation", "sourceHandle": "output", "target": "vis-reverse-polish-notation", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-reverse-polish-notation", "sourceHandle": "Prompt", "target": "prompt-reverse-polish-notation", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/rock-climbing.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-rock-climbing", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "You are to answer each given question with a single non plural form word, all lowercase, and without punctuation.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "You are to answer each given question with a single non plural form word, all lowercase, and without punctuation.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-rock-climbing", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideal = response.meta['Ideal'];\n\treturn response.text.startsWith(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-rock-climbing", "type": "vis", "data": {"input": "eval-rock-climbing"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-rock-climbing", "type": "inspect", "data": {"input": "prompt-rock-climbing"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-rock-climbing", "type": "table", "data": {"rows": [{"prompt": "The name actually comes from the way your fingers hold it so this climbing hold describes a small but positive edge you can only fit the top pad of your fingers 
on.", "ideal": "crimp"}, {"prompt": "Normally describes a large, deep climbing hold that you can wrap your whole hand around.", "ideal": "jug"}, {"prompt": "Often large, round climbing holds that do not have a positive gradient. This means you can\u2019t close your fingers around them at all and your hand remains quite open.", "ideal": "sloper"}, {"prompt": "You must pull sideways on this climbing hold rather than downwards.  The place you put your fingers is on the side of the climbing hold which is facing away from you.", "ideal": "sidepull"}, {"prompt": "You must pull sideways on this climbing hold rather than downwards.  The place you put your fingers is on the side of the climbing hold which is facing towards you.", "ideal": "gaston"}, {"prompt": "You must pull upwards on this climbing hold rather than downwards.  The place you put your fingers is on the side of the climbing hold which is facing downwards.", "ideal": "undercling"}, {"prompt": "A climbing hold that requires your thumb to get in on the action as well. Often the squeezing action is what is required to grip and use this climbing hold.", "ideal": "pinch"}, {"prompt": "Rather than gripping a variation in angle on the wall, you are dealing with a climbing hold which is an actual hole that has been eroded in. 
This climbing hold comes in all shapes and sizes.", "ideal": "pocket"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-rock-climbing", "sourceHandle": "prompt", "target": "eval-rock-climbing", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-rock-climbing", "sourceHandle": "prompt", "target": "inspect-rock-climbing", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-rock-climbing", "sourceHandle": "output", "target": "vis-rock-climbing", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-rock-climbing", "sourceHandle": "Prompt", "target": "prompt-rock-climbing", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/russian-rhyme.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-russian-rhyme", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "For each pair of words, determine whether their Russian translations rhyme. If they do, output the pair of rhyming words in Russian. If not, output NONE.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "For each pair of words, determine whether their Russian translations rhyme. If they do, output the pair of rhyming words in Russian. If not, output NONE.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-russian-rhyme", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet txt = response.text;\n\tlet ideal = response.meta['Ideal'];\n\treturn ideal.includes(txt) || txt.includes(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-russian-rhyme", "type": "vis", "data": {"input": "eval-russian-rhyme"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-russian-rhyme", "type": "inspect", "data": {"input": "prompt-russian-rhyme"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-russian-rhyme", "type": "table", "data": {"rows": [{"prompt": "cannon, toy", "ideal": 
"\u043f\u0443\u0448\u043a\u0430, \u0438\u0433\u0440\u0443\u0448\u043a\u0430"}, {"prompt": "life, organism", "ideal": "\u0436\u0438\u0437\u043d\u044c, \u043e\u0440\u0433\u0430\u043d\u0438\u0437\u043c"}, {"prompt": "human, escape", "ideal": "\u0447\u0435\u043b\u043e\u0432\u0435\u043a, \u043f\u043e\u0431\u0435\u0433"}, {"prompt": "soul, ramson", "ideal": "\u0434\u0443\u0448\u0430, \u0447\u0435\u0440\u0435\u043c\u0448\u0430"}, {"prompt": "peace, marshmallow", "ideal": "\u043c\u0438\u0440, \u0437\u0435\u0444\u0438\u0440"}, {"prompt": "sky, turnip", "ideal": "\u043d\u0435\u0431\u043e, \u0440\u0435\u043f\u0430"}, {"prompt": "summer, coin", "ideal": "\u043b\u0435\u0442\u043e, \u043c\u043e\u043d\u0435\u0442\u0430"}, {"prompt": "smile, violin", "ideal": "\u0443\u043b\u044b\u0431\u043a\u0430, \u0441\u043a\u0440\u0438\u043f\u043a\u0430"}, {"prompt": "sun, shaking", "ideal": "NONE"}, {"prompt": "rain, snow", "ideal": "NONE"}, {"prompt": "house, street", "ideal": "NONE"}, {"prompt": "flower, tree", "ideal": "NONE"}, {"prompt": "car, train", "ideal": "NONE"}, {"prompt": "mountain, valley", "ideal": "NONE"}, {"prompt": "day, night", "ideal": "NONE"}, {"prompt": "book, pen", "ideal": "NONE"}, {"prompt": "apple, orange", "ideal": "NONE"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-russian-rhyme", "sourceHandle": "prompt", "target": "eval-russian-rhyme", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-russian-rhyme", "sourceHandle": "prompt", "target": "inspect-russian-rhyme", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": 
"reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-russian-rhyme", "sourceHandle": "output", "target": "vis-russian-rhyme", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-russian-rhyme", "sourceHandle": "Prompt", "target": "prompt-russian-rhyme", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/south-african-bands.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-south-african-bands", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "A user will give you a name of a South African band. Name the lead vocalist, if they use a stage name answer with that instead of real name. Restrict answers to name only, with no further explanations being necessary.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "A user will give you a name of a South African band. Name the lead vocalist, if they use a stage name answer with that instead of real name. Restrict answers to name only, with no further explanations being necessary.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-south-african-bands", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideal = response.meta['Ideal'];\n\treturn response.text.startsWith(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-south-african-bands", "type": "vis", "data": {"input": "eval-south-african-bands"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-south-african-bands", "type": "inspect", "data": {"input": "prompt-south-african-bands"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 
417, "id": "table-south-african-bands", "type": "table", "data": {"rows": [{"prompt": "Watershed", "ideal": "Craig Hinds"}, {"prompt": "Ballyhoo", "ideal": "Derrick Dryan"}, {"prompt": "Hi-5", "ideal": "Niel Schoombee"}, {"prompt": "Jack Hammer", "ideal": "Piet Botha"}, {"prompt": "The Skylarks", "ideal": "Miriam Makeba"}, {"prompt": "Freshlyground", "ideal": "Zolani Mahola"}, {"prompt": "Savuka", "ideal": "Johnny Clegg"}, {"prompt": "Die Antwoord", "ideal": "Ninja"}, {"prompt": "Caf\u00e9 Society", "ideal": "Julia Jade Aston"}, {"prompt": "Beatenberg", "ideal": "Matthew Field"}, {"prompt": "The Kiffness", "ideal": "David Scott"}, {"prompt": "Mango Groove", "ideal": "Claire Johnston"}, {"prompt": "\u00c9Void", "ideal": "Erik Windrich"}, {"prompt": "The Bang", "ideal": "Joshua Gregg"}, {"prompt": "The Parlotones", "ideal": "Kahn Morbee"}, {"prompt": "Savuka", "ideal": "Johnny Clegg"}, {"prompt": "Henry Ate", "ideal": "Karma-Ann Swanepoel"}, {"prompt": "Lark", "ideal": "Inge Beckmann"}, {"prompt": "Boo!", "ideal": "Chris Chameleon"}, {"prompt": "Little Sister", "ideal": "Debbi Lonmon"}, {"prompt": "Prime Circle", "ideal": "Ross Learmonth"}, {"prompt": "Four Jacks and a Jill", "ideal": "Glenys Lynne"}, {"prompt": "Rabbitt", "ideal": "Trevor Rabin"}, {"prompt": "The Narrow", "ideal": "Hanu de Jong"}, {"prompt": "Just Jinjer", "ideal": "Ard Matthews"}, {"prompt": "Beast", "ideal": "Inge Beckmann"}, {"prompt": "Taxi Violence", "ideal": "George van der Spuy"}, {"prompt": "HONEYMOAN", "ideal": "Alison Rachel"}, {"prompt": "Fire Through the Window", "ideal": "Sinead Dennis"}, {"prompt": "Shortstraw", "ideal": "Alastair Thomas"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-south-african-bands", "sourceHandle": "prompt", "target": "eval-south-african-bands", "targetHandle": 
"responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-south-african-bands", "sourceHandle": "prompt", "target": "inspect-south-african-bands", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-south-african-bands", "sourceHandle": "output", "target": "vis-south-african-bands", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-south-african-bands", "sourceHandle": "Prompt", "target": "prompt-south-african-bands", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/spanish_feminine_noun_masculine_article.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-spanish_feminine_noun_masculine_article", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "You will be given a singular feminine Spanish word. What article should come before this word \"La\" or \"El\"? Answer with either \"La\" or \"El\" only", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "You will be given a singular feminine Spanish word. What article should come before this word \"La\" or \"El\"? Answer with either \"La\" or \"El\" only", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-spanish_feminine_noun_masculine_article", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideals = JSON.parse(response.meta['Ideal']);\n\treturn ideals.some(i => response.text.startsWith(i));\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-spanish_feminine_noun_masculine_article", "type": "vis", "data": {"input": "eval-spanish_feminine_noun_masculine_article"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-spanish_feminine_noun_masculine_article", "type": "inspect", "data": {"input": "prompt-spanish_feminine_noun_masculine_article"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, 
{"width": 423, "height": 417, "id": "table-spanish_feminine_noun_masculine_article", "type": "table", "data": {"rows": [{"prompt": "agua", "ideal": "[\"El\"]"}, {"prompt": "\u00e1guila", "ideal": "[\"El\"]"}, {"prompt": "ala", "ideal": "[\"El\"]"}, {"prompt": "alba", "ideal": "[\"El\"]"}, {"prompt": "alma", "ideal": "[\"El\"]"}, {"prompt": "ama de casa", "ideal": "[\"El\"]"}, {"prompt": "ancla", "ideal": "[\"El\"]"}, {"prompt": "arma", "ideal": "[\"El\"]"}, {"prompt": "arpa", "ideal": "[\"El\"]"}, {"prompt": "asma", "ideal": "[\"El\"]"}, {"prompt": "ave", "ideal": "[\"El\"]"}, {"prompt": "habla", "ideal": "[\"El\"]"}, {"prompt": "hacha", "ideal": "[\"El\"]"}, {"prompt": "hambre", "ideal": "[\"El\"]"}, {"prompt": "hampa", "ideal": "[\"El\"]"}, {"prompt": "hache", "ideal": "[\"La\"]"}, {"prompt": "a", "ideal": "[\"La\"]"}, {"prompt": "amapola", "ideal": "[\"La\"]"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-spanish_feminine_noun_masculine_article", "sourceHandle": "prompt", "target": "eval-spanish_feminine_noun_masculine_article", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-spanish_feminine_noun_masculine_article", "sourceHandle": "prompt", "target": "inspect-spanish_feminine_noun_masculine_article", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-spanish_feminine_noun_masculine_article", "sourceHandle": "output", "target": "vis-spanish_feminine_noun_masculine_article", "targetHandle": "input", "interactionWidth": 100, "markerEnd": 
{"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-spanish_feminine_noun_masculine_article", "sourceHandle": "Prompt", "target": "prompt-spanish_feminine_noun_masculine_article", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/syntax-check.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-syntax-check", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "You are an IDE plugin assistant. Determine the named programming language or framework based on the partial code snippet. Respond only with the name.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "You are an IDE plugin assistant. Determine the named programming language or framework based on the partial code snippet. Respond only with the name.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-syntax-check", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideal = response.meta['Ideal'];\n\treturn response.text.startsWith(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-syntax-check", "type": "vis", "data": {"input": "eval-syntax-check"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-syntax-check", "type": "inspect", "data": {"input": "prompt-syntax-check"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-syntax-check", "type": "table", "data": {"rows": [{"prompt": "const c=20;", "ideal": "JavaScript"}, {"prompt": "() => {}", "ideal": "JavaScript"}, {"prompt": 
"</script>", "ideal": "HTML"}, {"prompt": "puts [9,1]", "ideal": "Ruby"}, {"prompt": "ActionController::Base.render json: {data: @data}", "ideal": "Ruby on Rails"}, {"prompt": "(1..10).sum", "ideal": "Ruby"}, {"prompt": "const [items, setItems] = useState([])", "ideal": "React"}, {"prompt": "i in range(10)", "ideal": "Python"}, {"prompt": "sum [1..10]", "ideal": "Haskell"}, {"prompt": "map { $x += $_ } @a;", "ideal": "Perl"}, {"prompt": "import os", "ideal": "Python"}, {"prompt": "<h1>Welcome, {{ username|capitalize }}!</h1>", "ideal": "Jinja"}, {"prompt": "<style>", "ideal": "HTML"}, {"prompt": "push eax", "ideal": "Assembly"}, {"prompt": "store.dispatch({ type: 'ADD_TODO', text: 'Buy milk' });", "ideal": "Redux"}, {"prompt": "<DOCTYPE", "ideal": "HTML"}, {"prompt": "{{#if condition}}<h1>Log back in</h1>{{/if}}", "ideal": "Handlebars"}, {"prompt": "{% url 'myapp:view_name' arg1 arg2 %}", "ideal": "Django"}, {"prompt": "update : Msg -> Model -> (Model, Cmd Msg)", "ideal": "Elm"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-syntax-check", "sourceHandle": "prompt", "target": "eval-syntax-check", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-syntax-check", "sourceHandle": "prompt", "target": "inspect-syntax-check", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-syntax-check", "sourceHandle": "output", "target": "vis-syntax-check", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": 
"22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-syntax-check", "sourceHandle": "Prompt", "target": "prompt-syntax-check", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/oaievals/word_vector_over_reliance.cforge:
--------------------------------------------------------------------------------
1 | {"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-word_vector_over_reliance", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "You are a helpful assistant. Please choose the unique one word in given word set, just answer the chosen word with no transformation and no explanation.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "You are a helpful assistant. Please choose the unique one word in given word set, just answer the chosen word with no transformation and no explanation.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-word_vector_over_reliance", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideal = response.meta['Ideal'];\n\treturn response.text.startsWith(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-word_vector_over_reliance", "type": "vis", "data": {"input": "eval-word_vector_over_reliance"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-word_vector_over_reliance", "type": "inspect", "data": {"input": "prompt-word_vector_over_reliance"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-word_vector_over_reliance", "type": "table", "data": {"rows": [{"prompt": 
"one,0,ten.", "ideal": "0"}, {"prompt": "zoom,zoo,bike.", "ideal": "bike"}, {"prompt": "moon,fool,bike.", "ideal": "bike"}, {"prompt": "man,\u5973\u4eba,bike.", "ideal": "bike"}, {"prompt": "hair,fire,hire.", "ideal": "hair"}, {"prompt": "bee,fee,flower.", "ideal": "flower"}, {"prompt": "house,mouse,keyboard.", "ideal": "keyboard"}, {"prompt": "boom,room,human.", "ideal": "human"}, {"prompt": "fast,cast,least.", "ideal": "least"}, {"prompt": "one,\u4e8c,thousand.", "ideal": "\u4e8c"}, {"prompt": "five,give,5.", "ideal": "5"}, {"prompt": "bus,computer,business.", "ideal": "computer"}, {"prompt": "blue,glue,sky.", "ideal": "sky"}, {"prompt": "bean,beanie,sead.", "ideal": "sead"}, {"prompt": "zoo,foo,bike.", "ideal": "bike"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-word_vector_over_reliance", "sourceHandle": "prompt", "target": "eval-word_vector_over_reliance", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-word_vector_over_reliance", "sourceHandle": "prompt", "target": "inspect-word_vector_over_reliance", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-word_vector_over_reliance", "sourceHandle": "output", "target": "vis-word_vector_over_reliance", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-word_vector_over_reliance", "sourceHandle": "Prompt", "target": 
"prompt-word_vector_over_reliance", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}


--------------------------------------------------------------------------------
/chainforge/providers/__init__.py:
--------------------------------------------------------------------------------
1 | __all__ = ['CustomProviderProtocol', 'provider', 'ProviderRegistry']
2 | from .protocol import CustomProviderProtocol, provider, ProviderRegistry


--------------------------------------------------------------------------------
/chainforge/react-server/.eslintrc.js:
--------------------------------------------------------------------------------
 1 | module.exports = { // ESLint configuration for the react-server package
 2 |   ignorePatterns: [ // Paths that are never linted
 3 |     "node_modules/**",
 4 |     "build/**",
 5 |     "craco.config.js",
 6 |     "src/backend/pyodide/**",
 7 |     "src/backend/__test__/**",
 8 |   ],
 9 |   extends: [ // Shareable configs this project builds on
10 |     "semistandard",
11 |     "plugin:react/recommended",
12 |     "plugin:prettier/recommended",
13 |     "plugin:@typescript-eslint/recommended",
14 |   ],
15 |   rules: { // Project-specific overrides of the extended configs
16 |     semi: ["error", "always"], // A missing semicolon is reported as an error
17 |     camelcase: ["off"],
18 |     "react/prop-types": ["off"],
19 |     "@typescript-eslint/no-explicit-any": ["off"],
20 |     "@typescript-eslint/no-empty-function": ["off"],
21 |     "no-control-regex": ["off"],
22 |   },
23 | 
24 |   settings: { // NOTE(review): the entries below look like sample values (e.g. "myFavoriteWrapper", "CustomForm") — confirm which ones this project really needs
25 |     react: {
26 |       createClass: "createReactClass", // Regex for Component Factory to use,
27 |       // default to "createReactClass"
28 |       pragma: "React", // Pragma to use, default to "React"
29 |       fragment: "Fragment", // Fragment to use (may be a property of <pragma>), default to "Fragment"
30 |       version: "detect", // React version. "detect" automatically picks the version you have installed.
31 |       // You can also use `16.0`, `16.3`, etc, if you want to override the detected value.
32 |       // It will default to "latest" and warn if missing, and to "detect" in the future
33 |       flowVersion: "0.53", // Flow version
34 |     },
35 |     propWrapperFunctions: [
36 |       // The names of any function used to wrap propTypes, e.g. `forbidExtraProps`. If this isn't set, any propTypes wrapped in a function will be skipped.
37 |       "forbidExtraProps",
38 |       { property: "freeze", object: "Object" },
39 |       { property: "myFavoriteWrapper" },
40 |       // for rules that check exact prop wrappers
41 |       { property: "forbidExtraProps", exact: true },
42 |     ],
43 |     componentWrapperFunctions: [
44 |       // The name of any function used to wrap components, e.g. Mobx `observer` function. If this isn't set, components wrapped by these functions will be skipped.
45 |       "observer", // `property`
46 |       { property: "styled" }, // `object` is optional
47 |       { property: "observer", object: "Mobx" },
48 |       { property: "observer", object: "<pragma>" }, // sets `object` to whatever value `settings.react.pragma` is set to
49 |     ],
50 |     formComponents: [
51 |       // Components used as alternatives to <form> for forms, eg. <Form endpoint={ url } />
52 |       "CustomForm",
53 |       { name: "Form", formAttribute: "endpoint" },
54 |     ],
55 |     linkComponents: [
56 |       // Components used as alternatives to <a> for linking, eg. <Link to={ url } />
57 |       "Hyperlink",
58 |       { name: "Link", linkAttribute: "to" },
59 |     ],
60 |   },
61 | };
62 | 


--------------------------------------------------------------------------------
/chainforge/react-server/.gitignore:
--------------------------------------------------------------------------------
  1 | # Created by https://www.toptal.com/developers/gitignore/api/node,react
  2 | # Edit at https://www.toptal.com/developers/gitignore?templates=node,react
  3 | 
  4 | # Ignore build folder
  5 | build/
  6 | 
  7 | ### Node ###
  8 | # Logs
  9 | logs
 10 | *.log
 11 | npm-debug.log*
 12 | yarn-debug.log*
 13 | yarn-error.log*
 14 | lerna-debug.log*
 15 | .pnpm-debug.log*
 16 | 
 17 | # Diagnostic reports (https://nodejs.org/api/report.html)
 18 | report.[0-9]*.[0-9]*.[0-9]*.[0-9]*.json
 19 | 
 20 | # Runtime data
 21 | pids
 22 | *.pid
 23 | *.seed
 24 | *.pid.lock
 25 | 
 26 | # Directory for instrumented libs generated by jscoverage/JSCover
 27 | lib-cov
 28 | 
 29 | # Coverage directory used by tools like istanbul
 30 | coverage
 31 | *.lcov
 32 | 
 33 | # nyc test coverage
 34 | .nyc_output
 35 | 
 36 | # Grunt intermediate storage (https://gruntjs.com/creating-plugins#storing-task-files)
 37 | .grunt
 38 | 
 39 | # Bower dependency directory (https://bower.io/)
 40 | bower_components
 41 | 
 42 | # node-waf configuration
 43 | .lock-wscript
 44 | 
 45 | # Compiled binary addons (https://nodejs.org/api/addons.html)
 46 | build/Release
 47 | 
 48 | # Dependency directories
 49 | node_modules/
 50 | jspm_packages/
 51 | 
 52 | # Snowpack dependency directory (https://snowpack.dev/)
 53 | web_modules/
 54 | 
 55 | # TypeScript cache
 56 | *.tsbuildinfo
 57 | 
 58 | # Optional npm cache directory
 59 | .npm
 60 | 
 61 | # Optional eslint cache
 62 | .eslintcache
 63 | 
 64 | # Optional stylelint cache
 65 | .stylelintcache
 66 | 
 67 | # Microbundle cache
 68 | .rpt2_cache/
 69 | .rts2_cache_cjs/
 70 | .rts2_cache_es/
 71 | .rts2_cache_umd/
 72 | 
 73 | # Optional REPL history
 74 | .node_repl_history
 75 | 
 76 | # Output of 'npm pack'
 77 | *.tgz
 78 | 
 79 | # Yarn Integrity file
 80 | .yarn-integrity
 81 | 
 82 | # dotenv environment variable files
 83 | .env
 84 | .env.development.local
 85 | .env.test.local
 86 | .env.production.local
 87 | .env.local
 88 | 
 89 | # parcel-bundler cache (https://parceljs.org/)
 90 | .cache
 91 | .parcel-cache
 92 | 
 93 | # Next.js build output
 94 | .next
 95 | out
 96 | 
 97 | # Nuxt.js build / generate output
 98 | .nuxt
 99 | dist
100 | 
101 | # Gatsby files
102 | .cache/
103 | # Comment in the public line in if your project uses Gatsby and not Next.js
104 | # https://nextjs.org/blog/next-9-1#public-directory-support
105 | # public
106 | 
107 | # vuepress build output
108 | .vuepress/dist
109 | 
110 | # vuepress v2.x temp and cache directory
111 | .temp
112 | 
113 | # Docusaurus cache and generated files
114 | .docusaurus
115 | 
116 | # Serverless directories
117 | .serverless/
118 | 
119 | # FuseBox cache
120 | .fusebox/
121 | 
122 | # DynamoDB Local files
123 | .dynamodb/
124 | 
125 | # TernJS port file
126 | .tern-port
127 | 
128 | # Stores VSCode versions used for testing VSCode extensions
129 | .vscode-test
130 | 
131 | # yarn v2
132 | .yarn/cache
133 | .yarn/unplugged
134 | .yarn/build-state.yml
135 | .yarn/install-state.gz
136 | .pnp.*
137 | 
138 | ### Node Patch ###
139 | # Serverless Webpack directories
140 | .webpack/
141 | 
142 | # Optional stylelint cache
143 | 
144 | # SvelteKit build / generate output
145 | .svelte-kit
146 | 
147 | ### react ###
148 | .DS_*
149 | **/*.backup.*
150 | **/*.back.*
151 | 
152 | node_modules
153 | 
154 | *.sublime*
155 | 
156 | psd
157 | thumb
158 | sketch
159 | 
160 | # End of https://www.toptal.com/developers/gitignore/api/node,react


--------------------------------------------------------------------------------
/chainforge/react-server/.nvmrc:
--------------------------------------------------------------------------------
1 | 20.5.1
2 | 


--------------------------------------------------------------------------------
/chainforge/react-server/.prettierignore:
--------------------------------------------------------------------------------
1 | # Ignore artifacts:
2 | build
3 | public
4 | **/*.html


--------------------------------------------------------------------------------
/chainforge/react-server/.prettierrc.json:
--------------------------------------------------------------------------------
1 | {
2 |   "trailingComma": "all",
3 |   "tabWidth": 2,
4 |   "semi": true,
5 |   "singleQuote": false
6 | }
7 | 


--------------------------------------------------------------------------------
/chainforge/react-server/README.md:
--------------------------------------------------------------------------------
 1 | # ChainForge React Server
 2 | 
 3 | This project was bootstrapped with [Create React App](https://github.com/facebook/create-react-app).
 4 | 
 5 | ## Available Scripts
 6 | 
 7 | In the project directory, you can run:
 8 | 
 9 | ### `npm start`
10 | 
11 | Runs the app in the development mode.\
12 | Open [http://localhost:3000](http://localhost:3000) to view it in your browser.
13 | 
14 | The page will reload when you make changes.\
15 | You may also see any lint errors in the console.
16 | 
17 | ### `npm test`
18 | 
19 | Launches the test runner in the interactive watch mode.\
20 | See the section about [running tests](https://facebook.github.io/create-react-app/docs/running-tests) for more information.
21 | 
22 | ### `npm run build`
23 | 
24 | Builds the app for production to the `build` folder.\
25 | It correctly bundles React in production mode and optimizes the build for the best performance.
26 | 
27 | The build is minified and the filenames include the hashes.\
28 | Your app is ready to be deployed!
29 | 
30 | See the section about [deployment](https://facebook.github.io/create-react-app/docs/deployment) for more information.
31 | 
32 | ### `npm run eject`
33 | 
34 | **Note: this is a one-way operation. Once you `eject`, you can't go back!**
35 | 
36 | If you aren't satisfied with the build tool and configuration choices, you can `eject` at any time. This command will remove the single build dependency from your project.
37 | 
38 | Instead, it will copy all the configuration files and the transitive dependencies (webpack, Babel, ESLint, etc) right into your project so you have full control over them. All of the commands except `eject` will still work, but they will point to the copied scripts so you can tweak them. At this point you're on your own.
39 | 
40 | You don't have to ever use `eject`. The curated feature set is suitable for small and middle deployments, and you shouldn't feel obligated to use this feature. However we understand that this tool wouldn't be useful if you couldn't customize it when you are ready for it.
41 | 
42 | ## Learn More
43 | 
44 | You can learn more in the [Create React App documentation](https://facebook.github.io/create-react-app/docs/getting-started).
45 | 
46 | To learn React, check out the [React documentation](https://reactjs.org/).
47 | 
48 | ### Code Splitting
49 | 
50 | This section has moved here: [https://facebook.github.io/create-react-app/docs/code-splitting](https://facebook.github.io/create-react-app/docs/code-splitting)
51 | 
52 | ### Analyzing the Bundle Size
53 | 
54 | This section has moved here: [https://facebook.github.io/create-react-app/docs/analyzing-the-bundle-size](https://facebook.github.io/create-react-app/docs/analyzing-the-bundle-size)
55 | 
56 | ### Making a Progressive Web App
57 | 
58 | This section has moved here: [https://facebook.github.io/create-react-app/docs/making-a-progressive-web-app](https://facebook.github.io/create-react-app/docs/making-a-progressive-web-app)
59 | 
60 | ### Advanced Configuration
61 | 
62 | This section has moved here: [https://facebook.github.io/create-react-app/docs/advanced-configuration](https://facebook.github.io/create-react-app/docs/advanced-configuration)
63 | 
64 | ### Deployment
65 | 
66 | This section has moved here: [https://facebook.github.io/create-react-app/docs/deployment](https://facebook.github.io/create-react-app/docs/deployment)
67 | 
68 | ### `npm run build` fails to minify
69 | 
70 | This section has moved here: [https://facebook.github.io/create-react-app/docs/troubleshooting#npm-run-build-fails-to-minify](https://facebook.github.io/create-react-app/docs/troubleshooting#npm-run-build-fails-to-minify)
71 | 


--------------------------------------------------------------------------------
/chainforge/react-server/craco.config.js:
--------------------------------------------------------------------------------
 1 | const webpack = require("webpack");
 2 | 
 3 | // const dotenv = require('dotenv').config({ path: __dirname + '/.env' })
 4 | const isDevelopment = process.env.NODE_ENV !== "production"; // NOTE(review): not referenced by any live code in this file, only by the commented-out DefinePlugin block below
 5 | 
 6 | module.exports = { // CRACO overrides applied on top of the Create React App build
 7 |   eslint: {
 8 |     enable: false, // ESLint is switched off for the CRACO build
 9 |   },
10 |   webpack: {
11 |     configure: {
12 |       resolve: {
13 |         fallback: { // Browser substitutes for Node core modules; entries set to `false` get no substitute
14 |           process: require.resolve("process/browser"),
15 |           buffer: require.resolve("buffer"),
16 |           https: require.resolve("https-browserify"),
17 |           querystring: require.resolve("querystring-es3"),
18 |           url: require.resolve("url/"),
19 |           os: require.resolve("os-browserify/browser"),
20 |           stream: require.resolve("stream-browserify"),
21 |           path: require.resolve("path-browserify"),
22 |           util: require.resolve("util/"),
23 |           crypto: require.resolve("crypto-browserify"),
24 |           assert: require.resolve("assert/"),
25 |           http: require.resolve("stream-http"),
26 |           net: require.resolve("net-browserify"),
27 |           zlib: require.resolve("browserify-zlib"),
28 |           fs: false,
29 |           child_process: false,
30 |         },
31 |       },
32 |     },
33 | 
34 |     module: { // NOTE(review): this key sits beside `configure`, not inside it — confirm CRACO actually applies `module.rules` from this position
35 |       rules: [
36 |         {
37 |           test: /node_modules\/https-proxy-agent\//,
38 |           use: "null-loader",
39 |         },
40 |       ],
41 |     },
42 | 
43 |     plugins: {
44 |       add: [
45 |         new webpack.ProvidePlugin({ // Supplies `process` to bundled code that references it without importing it
46 |           process: "process/browser.js",
47 |         }),
48 | 
49 |         // Work around for Buffer is undefined:
50 |         // https://github.com/webpack/changelog-v5/issues/10
51 |         new webpack.ProvidePlugin({
52 |           Buffer: ["buffer", "Buffer"],
53 |         }),
54 |       ],
55 |     },
56 | 
57 |     // plugins: {add: [
58 |     //   new webpack.DefinePlugin({
59 |     //     // 'process': "{}",
60 |     //     'process.env': "{}", // JSON.stringify(dotenv.parsed),
61 |     //     // 'process.env.NODE_ENV': JSON.stringify(isDevelopment ? 'development' : 'production'),
62 |     //   }),
63 |     // ]},
64 |   },
65 | };
66 | 


--------------------------------------------------------------------------------
/chainforge/react-server/package.json:
--------------------------------------------------------------------------------
  1 | {
  2 |   "name": "chain-forge",
  3 |   "version": "0.1.0",
  4 |   "private": true,
  5 |   "engines": {
  6 |     "node": "^20"
  7 |   },
  8 |   "dependencies": {
  9 |     "@anthropic-ai/sdk": "^0.4.4",
 10 |     "@azure/openai": "^1.0.0-beta.2",
 11 |     "@codemirror/lang-javascript": "^6.1.5",
 12 |     "@codemirror/lang-python": "^6.1.2",
 13 |     "@emoji-mart/data": "^1.1.2",
 14 |     "@emoji-mart/react": "^1.1.1",
 15 |     "@fontsource/geist-mono": "^5.0.1",
 16 |     "@google-ai/generativelanguage": "^0.2.0",
 17 |     "@google/generative-ai": "^0.21.0",
 18 |     "@mantine/core": "^6.0.9",
 19 |     "@mantine/dates": "^6.0.13",
 20 |     "@mantine/dropzone": "^6.0.19",
 21 |     "@mantine/form": "^6.0.11",
 22 |     "@mantine/prism": "^6.0.15",
 23 |     "@mirai73/bedrock-fm": "^0.4.10",
 24 |     "@reactflow/background": "^11.2.0",
 25 |     "@reactflow/controls": "^11.1.11",
 26 |     "@reactflow/core": "^11.7.0",
 27 |     "@reactflow/node-resizer": "^2.1.0",
 28 |     "@rjsf/core": "^5.7.3",
 29 |     "@rjsf/utils": "^5.7.3",
 30 |     "@rjsf/validator-ajv8": "^5.7.3",
 31 |     "@tabler/icons-react": "^2.47.0",
 32 |     "@testing-library/jest-dom": "^5.16.5",
 33 |     "@testing-library/react": "^13.4.0",
 34 |     "@testing-library/user-event": "^13.5.0",
 35 |     "@types/jest": "^29.5.2",
 36 |     "@types/node": "^20.3.2",
 37 |     "@types/react": "^18.2.14",
 38 |     "@types/react-dom": "^18.2.6",
 39 |     "@uiw/codemirror-theme-material": "^4.19.16",
 40 |     "@uiw/codemirror-theme-noctis-lilac": "^4.19.16",
 41 |     "@uiw/codemirror-theme-okaidia": "^4.19.16",
 42 |     "@uiw/codemirror-theme-solarized": "^4.19.16",
 43 |     "@uiw/codemirror-theme-sublime": "^4.19.16",
 44 |     "@uiw/codemirror-theme-xcode": "^4.19.16",
 45 |     "@uiw/codemirror-themes": "^4.19.16",
 46 |     "@uiw/react-codemirror": "^4.19.16",
 47 |     "ace-builds": "^1.18.0",
 48 |     "assert": "^2.0.0",
 49 |     "bootstrap": "^5.2.3",
 50 |     "bottleneck": "^2.19.5",
 51 |     "browserify-zlib": "^0.2.0",
 52 |     "buffer": "^6.0.3",
 53 |     "codemirror": "^6.0.1",
 54 |     "codemirror-readonly-ranges": "^0.1.0-alpha.1",
 55 |     "compressorjs": "^1.2.1",
 56 |     "crypto-browserify": "^3.12.0",
 57 |     "dayjs": "^1.11.8",
 58 |     "emoji-mart": "^5.5.2",
 59 |     "emoji-picker-react": "^4.4.9",
 60 |     "google-auth-library": "^8.8.0",
 61 |     "https-browserify": "^1.0.0",
 62 |     "jstat": "^1.9.6",
 63 |     "jszip": "^3.10.1",
 64 |     "lazysizes": "^5.3.2",
 65 |     "lodash": "^4.17.21",
 66 |     "lz-string": "^1.5.0",
 67 |     "mantine-contextmenu": "^6.1.0",
 68 |     "mantine-react-table": "^1.3.4",
 69 |     "markdown-it": "^13.0.1",
 70 |     "mathjs": "^11.8.2",
 71 |     "mdast-util-from-markdown": "^2.0.0",
 72 |     "net": "^1.0.2",
 73 |     "net-browserify": "^0.2.4",
 74 |     "node-fetch": "^2.6.11",
 75 |     "openai": "~3.3.0",
 76 |     "os-browserify": "^0.3.0",
 77 |     "papaparse": "^5.4.1",
 78 |     "path-browserify": "^1.0.1",
 79 |     "plotly.js": "^2.21.0",
 80 |     "process": "^0.11.10",
 81 |     "querystring-es3": "^0.2.1",
 82 |     "react": "^18.2.0",
 83 |     "react-ace": "^10.1.0",
 84 |     "react-beautiful-dnd": "^13.1.1",
 85 |     "react-confetti-explosion": "^2.1.2",
 86 |     "react-csv": "^2.2.2",
 87 |     "react-device-detect": "^2.2.3",
 88 |     "react-dom": "^18.2.0",
 89 |     "react-edit-text": "^5.1.0",
 90 |     "react-plotly.js": "^2.6.0",
 91 |     "react-scripts": "5.0.1",
 92 |     "reactflow": "^11.0",
 93 |     "request": "^2.88.2",
 94 |     "simple-statistics": "^7.8.7",
 95 |     "socket.io-client": "^4.6.1",
 96 |     "stream-browserify": "^3.0.0",
 97 |     "stream-http": "^3.2.0",
 98 |     "styled-components": "^5.3.10",
 99 |     "tls": "^0.0.1",
100 |     "typescript": "^5.1.3",
101 |     "url": "^0.11.1",
102 |     "util": "^0.12.5",
103 |     "uuidv4": "^6.2.13",
104 |     "web-vitals": "^2.1.4",
105 |     "xlsx": "^0.18.5",
106 |     "zustand": "^4.3.7"
107 |   },
108 |   "overrides": {
109 |     "typescript": "^5.1.3"
110 |   },
111 |   "scripts": {
112 |     "start": "npx prettier -w . && npx eslint . && craco start",
113 |     "build": "npx prettier -w . && npx eslint . && craco build",
114 |     "test": "npx prettier -w . && npx eslint . && craco test",
115 |     "eject": "react-scripts eject",
116 |     "clean": "npx prettier -w . && npx eslint ."
117 |   },
118 |   "eslintConfig": {
119 |     "extends": [
120 |       "react-app",
121 |       "react-app/jest"
122 |     ]
123 |   },
124 |   "browserslist": {
125 |     "production": [
126 |       ">0.2%",
127 |       "not dead",
128 |       "not op_mini all"
129 |     ],
130 |     "development": [
131 |       "last 1 chrome version",
132 |       "last 1 firefox version",
133 |       "last 1 safari version"
134 |     ]
135 |   },
136 |   "devDependencies": {
137 |     "@craco/craco": "^7.1.0",
138 |     "@types/lodash": "^4.17.0",
139 |     "@types/papaparse": "^5.3.14",
140 |     "@types/react-beautiful-dnd": "^13.1.8",
141 |     "@types/react-edit-text": "^5.0.4",
142 |     "@types/react-plotly.js": "^2.6.3",
143 |     "@types/styled-components": "^5.1.34",
144 |     "eslint": "<9.0.0",
145 |     "eslint-config-prettier": "^9.1.0",
146 |     "eslint-config-semistandard": "^17.0.0",
147 |     "eslint-config-standard": "^17.1.0",
148 |     "eslint-plugin-import": "^2.29.1",
149 |     "eslint-plugin-n": "^15.7.0",
150 |     "eslint-plugin-prettier": "^5.1.3",
151 |     "eslint-plugin-promise": "^6.1.1",
152 |     "eslint-plugin-react": "^7.33.2",
153 |     "jest": "^27.5.1",
154 |     "worker-loader": "^3.0.8"
155 |   }
156 | }
157 | 


--------------------------------------------------------------------------------
/chainforge/react-server/public/favicon.ico:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ianarawjo/ChainForge/0b22ad4e0bc0a18c5675157b1c8ff4b6e57b410d/chainforge/react-server/public/favicon.ico


--------------------------------------------------------------------------------
/chainforge/react-server/public/index.html:
--------------------------------------------------------------------------------
 1 | <!doctype html>
 2 | <html lang="en">
 3 |   <head>
 4 |     <meta charset="utf-8" />
 5 |     <!-- Google tag (gtag.js) -->
 6 |     <script
 7 |       async
 8 |       src="https://www.googletagmanager.com/gtag/js?id=G-RN3FDBLMCR"
 9 |     ></script>
10 |     <script>
11 |       window.dataLayer = window.dataLayer || [];
12 |       function gtag() {
13 |         dataLayer.push(arguments);
14 |       }
15 |       gtag("js", new Date());
16 | 
17 |       gtag("config", "G-RN3FDBLMCR");
18 |     </script>
19 |     <!-- Logo from bqlqn @ flaticon.com; used with attribution: https://www.flaticon.com/free-icon/link_1209950 -->
20 |     <link rel="icon" href="%PUBLIC_URL%/favicon.ico" />
21 |     <meta name="viewport" content="width=device-width, initial-scale=1" />
22 |     <meta name="theme-color" content="#000000" />
23 |     <meta
24 |       name="description"
25 |       content="A visual programming environment for prompt engineering"
26 |     />
27 |     <link rel="apple-touch-icon" href="%PUBLIC_URL%/logo192.png" />
28 |     <!--
29 |       manifest.json provides metadata used when your web app is installed on a
30 |       user's mobile device or desktop. See https://developers.google.com/web/fundamentals/web-app-manifest/
31 |     -->
32 |     <link rel="manifest" href="%PUBLIC_URL%/manifest.json" />
33 |     <!--
34 |       Notice the use of %PUBLIC_URL% in the tags above.
35 |       It will be replaced with the URL of the `public` folder during the build.
36 |       Only files inside the `public` folder can be referenced from the HTML.
37 | 
38 |       Unlike "/favicon.ico" or "favicon.ico", "%PUBLIC_URL%/favicon.ico" will
39 |       work correctly both with client-side routing and a non-root public URL.
40 |       Learn how to configure a non-root public URL by running `npm run build`.
41 |     -->
42 |     <title>ChainForge</title>
43 |   </head>
44 |   <body>
45 |     <noscript>You need to enable JavaScript to run this app.</noscript>
46 |     <div id="root"></div>
47 |     <!--
48 |       This HTML file is a template.
49 |       If you open it directly in the browser, you will see an empty page.
50 | 
51 |       You can add webfonts, meta tags, or analytics to this file.
52 |       The build step will place the bundled scripts into the <body> tag.
53 | 
54 |       To begin the development, run `npm start` or `yarn start`.
55 |       To create a production bundle, use `npm run build` or `yarn build`.
56 |     -->
57 |   </body>
58 | </html>
59 | 


--------------------------------------------------------------------------------
/chainforge/react-server/public/logo192.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ianarawjo/ChainForge/0b22ad4e0bc0a18c5675157b1c8ff4b6e57b410d/chainforge/react-server/public/logo192.png


--------------------------------------------------------------------------------
/chainforge/react-server/public/logo512.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ianarawjo/ChainForge/0b22ad4e0bc0a18c5675157b1c8ff4b6e57b410d/chainforge/react-server/public/logo512.png


--------------------------------------------------------------------------------
/chainforge/react-server/public/manifest.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "short_name": "ChainForge",
 3 |   "name": "ChainForge",
 4 |   "icons": [
 5 |     {
 6 |       "src": "favicon.ico",
 7 |       "sizes": "64x64 32x32 24x24 16x16",
 8 |       "type": "image/x-icon"
 9 |     },
10 |     {
11 |       "src": "logo192.png",
12 |       "type": "image/png",
13 |       "sizes": "192x192"
14 |     },
15 |     {
16 |       "src": "logo512.png",
17 |       "type": "image/png",
18 |       "sizes": "512x512"
19 |     }
20 |   ],
21 |   "start_url": ".",
22 |   "display": "standalone",
23 |   "theme_color": "#000000",
24 |   "background_color": "#ffffff"
25 | }
26 | 


--------------------------------------------------------------------------------
/chainforge/react-server/public/robots.txt:
--------------------------------------------------------------------------------
1 | # https://www.robotstxt.org/robotstxt.html
2 | User-agent: *
3 | Disallow:
4 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/AlertModal.tsx:
--------------------------------------------------------------------------------
 1 | /** An alert popup for displaying errors */
 2 | import React, {
 3 |   useState,
 4 |   forwardRef,
 5 |   useImperativeHandle,
 6 |   createContext,
 7 |   useRef,
 8 |   useMemo,
 9 | } from "react";
10 | import { useDisclosure } from "@mantine/hooks";
11 | import { Modal, ModalBaseStylesNames, Styles } from "@mantine/core";
12 | 
13 | const ALERT_MODAL_STYLE = {
14 |   header: { backgroundColor: "#E52A2A", color: "white" },
15 | } as Styles<ModalBaseStylesNames>;
16 | 
17 | export interface AlertModalRef {
18 |   trigger: (msg?: string | Error) => void;
19 | }
20 | 
21 | /**
22 |  * Pop-up dialog that surfaces an error message to the user.
23 |  */
24 | export const AlertModal = forwardRef<AlertModalRef>(
25 |   function AlertModal(props, ref) {
26 |     // Text currently shown, plus the open/closed state of the Mantine modal
27 |     const [alertMsg, setAlertMsg] = useState("");
28 |     const [opened, { open, close }] = useDisclosure(false);
29 | 
30 |     // Expose trigger() to the parent through the forwarded ref
31 |     useImperativeHandle(ref, () => ({
32 |       trigger: (msg?: string | Error) => {
33 |         // Falsy input falls back to a generic message; Errors show .message
34 |         let text = "Unknown error.";
35 |         if (msg) text = typeof msg === "string" ? msg : msg.message;
36 |         console.error(text);
37 |         setAlertMsg(text);
38 |         open();
39 |       },
40 |     }));
41 | 
42 |     return (
43 |       <Modal
44 |         opened={opened}
45 |         onClose={close}
46 |         title="Error"
47 |         styles={ALERT_MODAL_STYLE}
48 |       >
49 |         <p style={{ whiteSpace: "pre-line" }}>{alertMsg}</p>
50 |       </Modal>
51 |     );
52 |   },
53 | );
54 | export default AlertModal;
55 | 
56 | export const AlertModalContext = createContext<
57 |   ((msg?: string | Error) => void) | undefined
58 | >(undefined);
59 | 
60 | /**
61 |  * Provides one shared AlertModal to the whole component tree through AlertModalContext.
62 |  * `children` is typed as ReactNode so that a single child or several are both accepted.
63 |  */
64 | export const AlertModalProvider = ({
65 |   children,
66 | }: {
67 |   children: React.ReactNode;
68 | }) => {
69 |   // Create one AlertModal for the entire application
70 |   const alertModal = useRef<AlertModalRef>(null);
71 | 
72 |   // We have to wrap trigger() in a memoized function, as passing it down directly will trigger re-renders every frame.
73 |   const showAlert = useMemo(() => {
74 |     return (msg?: string | Error) => alertModal.current?.trigger(msg);
75 |   }, [alertModal]);
76 | 
77 |   return (
78 |     <AlertModalContext.Provider value={showAlert}>
79 |       <AlertModal ref={alertModal} />
80 |       {children}
81 |     </AlertModalContext.Provider>
82 |   );
83 | };
84 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/App.css:
--------------------------------------------------------------------------------
 1 | .App {
 2 |   text-align: center;
 3 | }
 4 | 
 5 | .App-logo {
 6 |   height: 40vmin;
 7 |   pointer-events: none;
 8 | }
 9 | 
10 | path.react-flow__edge-path {
11 |   stroke-width: 4;
12 | }
13 | 
14 | path.react-flow__edge-path:hover {
15 |   stroke-width: 10;
16 |   color: red;
17 | }
18 | 
19 | @media (prefers-reduced-motion: no-preference) {
20 |   .App-logo {
21 |     animation: App-logo-spin infinite 20s linear;
22 |   }
23 | }
24 | 
25 | .App-header {
26 |   background-color: #282c34;
27 |   min-height: 100vh;
28 |   display: flex;
29 |   flex-direction: column;
30 |   align-items: center;
31 |   justify-content: center;
32 |   font-size: calc(10px + 2vmin);
33 |   color: white;
34 | }
35 | 
36 | .App-link {
37 |   color: #61dafb;
38 | }
39 | 
40 | @keyframes App-logo-spin {
41 |   from {
42 |     transform: rotate(0deg);
43 |   }
44 |   to {
45 |     transform: rotate(360deg);
46 |   }
47 | }
48 | 
49 | .rich-editor {
50 |   min-width: 500px;
51 |   min-height: 500px;
52 | }
53 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/AreYouSureModal.tsx:
--------------------------------------------------------------------------------
 1 | import React, { forwardRef, useImperativeHandle } from "react";
 2 | import { Modal, Button, Box, Text, Flex } from "@mantine/core";
 3 | import { useDisclosure } from "@mantine/hooks";
 4 | 
 5 | export interface AreYouSureModalProps {
 6 |   title: string;
 7 |   message: string;
 8 |   color?: string;
 9 |   onConfirm?: () => void;
10 | }
11 | 
12 | export interface AreYouSureModalRef {
13 |   trigger: () => void;
14 | }
15 | 
16 | /** Confirmation dialog: shows a message with Cancel / Confirm buttons; Confirm invokes onConfirm. */
17 | const AreYouSureModal = forwardRef<AreYouSureModalRef, AreYouSureModalProps>(
18 |   function AreYouSureModal({ title, message, color, onConfirm }, ref) {
19 |     const [opened, { open, close }] = useDisclosure(false);
20 |     const description = message || "Are you sure?";
21 | 
22 |     // Expose trigger() via the forwarded ref so the parent can open the dialog
23 |     const trigger = () => {
24 |       open();
25 |     };
26 |     useImperativeHandle(ref, () => ({
27 |       trigger,
28 |     }));
29 | 
30 |     const confirmAndClose = () => {
31 |       close();
32 |       if (onConfirm) onConfirm();
33 |     };
34 | 
35 |     return (
36 |       <Modal
37 |         opened={opened}
38 |         onClose={close}
39 |         title={title}
40 |         styles={{
41 |           header: { backgroundColor: color ?? "orange", color: "white" },
42 |         }}
43 |       >
44 |         <Box maw={400} mx="auto" mt="md" mb="md">
45 |           <Text>{description}</Text>
46 |         </Box>
47 |         <Flex
48 |           mih={50}
49 |           gap="md"
50 |           justify="space-evenly"
51 |           align="center"
52 |           direction="row"
53 |           wrap="wrap"
54 |         >
55 |           <Button
56 |             variant="light"
57 |             color={color ?? "orange"}
58 |             type="submit"
59 |             w="40%"
60 |             onClick={close}
61 |           >
62 |             Cancel
63 |           </Button>
64 |           <Button
65 |             variant="filled"
66 |             color="blue"
67 |             type="submit"
68 |             w="40%"
69 |             onClick={confirmAndClose}
70 |           >
71 |             Confirm
72 |           </Button>
73 |         </Flex>
74 |       </Modal>
75 |     );
76 |   },
77 | );
78 | 
79 | export default AreYouSureModal;
80 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/ChatHistoryView.tsx:
--------------------------------------------------------------------------------
 1 | import React, { forwardRef } from "react";
 2 | 
 3 | export interface ChatHistoryViewProps {
 4 |   messages: React.ReactNode[];
 5 |   bgColors?: string[];
 6 | }
 7 | 
 8 | const ChatHistoryView = forwardRef<HTMLDivElement, ChatHistoryViewProps>(
 9 |   function ChatHistoryView({ messages, bgColors }, ref) {
10 |     // Colors and sides alternate by message index: even = left, odd = right
11 |     const palette = bgColors === undefined ? ["#333", "#333"] : bgColors;
12 |     const bubbles = messages.map((message, i) => {
13 |       const parity = i % 2;
14 |       const side = parity === 0 ? "left" : "right";
15 |       return (
16 |         <div
17 |           key={i}
18 |           className={`chat-bubble chat-msg-${side}`}
19 |           style={{ backgroundColor: palette[parity] }}
20 |         >
21 |           {message}
22 |         </div>
23 |       );
24 |     });
25 |     return <div ref={ref} className="chat-history">{bubbles}</div>;
26 |   },
27 | );
28 | 
29 | export default ChatHistoryView;
30 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/ColorThemeProvider.tsx:
--------------------------------------------------------------------------------
 1 | import React, { useEffect } from "react";
 2 | import { useLocalStorage } from "@mantine/hooks";
 3 | import {
 4 |   ColorScheme,
 5 |   ColorSchemeProvider,
 6 |   useMantineColorScheme,
 7 |   MantineProvider,
 8 |   Group,
 9 |   Switch,
10 | } from "@mantine/core";
11 | import { IconMoon, IconSunHigh } from "@tabler/icons-react";
12 | 
13 | /**
14 |  * Tries to detect the user's OS color scheme preference.
15 |  * Returns `undefined` when no `window` global exists (non-browser runtime)
16 |  * or the browser does not support the `prefers-color-scheme` media query.
17 |  */
18 | function getOSPreferredColorScheme(): "dark" | "light" | undefined {
19 |   if (
20 |     typeof window !== "undefined" &&
21 |     window.matchMedia &&
22 |     window.matchMedia("(prefers-color-scheme)").media !== "not all"
23 |   ) {
24 |     const prefersDark = window.matchMedia(
25 |       "(prefers-color-scheme: dark)",
26 |     ).matches;
27 |     return prefersDark ? "dark" : "light";
28 |   } else {
29 |     console.log("prefers-color-scheme not supported");
30 |     return undefined;
31 |   }
32 | }
33 | 
34 | export default function ColorThemeProvider({
35 |   children,
36 | }: {
37 |   children: React.ReactNode;
38 | }) {
39 |   // Stored under "mantine-color-scheme"; defaults to the OS preference, then "light"
40 |   const fallbackScheme = getOSPreferredColorScheme() ?? "light";
41 |   const [colorScheme, setColorScheme] = useLocalStorage<ColorScheme>({
42 |     key: "mantine-color-scheme",
43 |     defaultValue: fallbackScheme,
44 |     getInitialValueInEffect: true,
45 |   });
46 | 
47 |   // An explicit value wins; otherwise flip between "dark" and "light"
48 |   const toggleColorScheme = (value?: ColorScheme) => {
49 |     const flipped = colorScheme === "dark" ? "light" : "dark";
50 |     setColorScheme(value || flipped);
51 |   };
52 | 
53 |   // Mirror the scheme onto <html data-mantine-color-scheme>: MantineProvider in Mantine 6 does not set it.
54 |   // NOTE: Remove this workaround (and most likely change more code) when upgrading to Mantine 7.
55 |   useEffect(() => {
56 |     const root = document.documentElement;
57 |     root.setAttribute("data-mantine-color-scheme", colorScheme);
58 |   }, [colorScheme]);
59 | 
60 |   const theme = { colorScheme };
61 | 
62 |   return (
63 |     <ColorSchemeProvider
64 |       colorScheme={colorScheme}
65 |       toggleColorScheme={toggleColorScheme}
66 |     >
67 |       <MantineProvider withGlobalStyles withNormalizeCSS theme={theme}>
68 |         {children}
69 |       </MantineProvider>
70 |     </ColorSchemeProvider>
71 |   );
72 | }
73 | 
74 | export function ColorSchemeToggle() {
75 |   // The switch reads "on" in dark mode; flipping it toggles the Mantine scheme
76 |   const scheme = useMantineColorScheme();
77 |   const flip = () => scheme.toggleColorScheme();
78 |   return (
79 |     <Group position="center">
80 |       <Switch
81 |         description="Color theme"
82 |         checked={scheme.colorScheme === "dark"}
83 |         onChange={flip}
84 |         color="gray"
85 |         size="md"
86 |         onLabel={<IconMoon size={16} style={{ color: "cyan" }} />}
87 |         offLabel={<IconSunHigh size={16} style={{ color: "OrangeRed" }} />}
88 |       />
89 |     </Group>
90 |   );
91 | }
92 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/CommentNode.tsx:
--------------------------------------------------------------------------------
 1 | import React, { useState } from "react";
 2 | import useStore from "./store";
 3 | import NodeLabel from "./NodeLabelComponent";
 4 | import BaseNode from "./BaseNode";
 5 | import { Textarea } from "@mantine/core";
 6 | 
 7 | export interface CommentNodeProps {
 8 |   data: {
 9 |     text: string;
10 |     title: string;
11 |   };
12 |   id: string;
13 | }
14 | 
15 | /**
16 |  * A flow node with no inputs or outputs that
17 |  * holds a free-text comment written by the user.
18 |  */
19 | const CommentNode: React.FC<CommentNodeProps> = ({ data, id }) => {
20 |   const setDataPropsForNode = useStore((state) => state.setDataPropsForNode);
21 |   const [value, setValue] = useState(data.text || "");
22 |   // Keep the local textarea state and the node's stored `text` in sync
23 |   const handleChangeComment = (evt: React.ChangeEvent<HTMLTextAreaElement>) => {
24 |     const text = evt.currentTarget.value;
25 |     setValue(text);
26 |     setDataPropsForNode(id, { text });
27 |   };
28 | 
29 |   return (
30 |     <BaseNode classNames="comment-node" nodeId={id}>
31 |       <NodeLabel title={data.title || "Comment"} nodeId={id} icon="✏️" />
32 |       <Textarea
33 |         value={value}
34 |         onChange={handleChangeComment}
35 |         placeholder="I love ChainForge!"
36 |         className="nodrag"
37 |         autosize
38 |         w="260px"
39 |         minRows={2}
40 |         styles={{ input: { border: "none", backgroundColor: "#eee" } }}
41 |       />
42 |     </BaseNode>
43 |   );
44 | };
45 | 
46 | export default CommentNode;
47 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/EvalGen/ReportCardStep.tsx:
--------------------------------------------------------------------------------
  1 | import React, { useMemo } from "react";
  2 | import {
  3 |   Button,
  4 |   Card,
  5 |   Flex,
  6 |   Group,
  7 |   ScrollArea,
  8 |   SimpleGrid,
  9 |   Stack,
 10 |   Text,
 11 | } from "@mantine/core";
 12 | import { EvalCriteria, EvalFunctionSetReport } from "../backend/evalgen/typing";
 13 | import { CriteriaCard } from "./PickCriteriaStep";
 14 | 
 15 | interface ReportCardStepProps {
 16 |   criteria: EvalCriteria[];
 17 |   report: EvalFunctionSetReport | null;
 18 |   onFinish: (reports: EvalFunctionSetReport) => void;
 19 |   onPrevious: () => void;
 20 |   setOnNextCallback: React.Dispatch<React.SetStateAction<() => unknown>>;
 21 | }
 22 | 
 23 | // EvalGen report step: shows the chosen eval functions with their alignment
 24 | // numbers, and passes the report to `onFinish` when the user confirms.
 25 | const ReportCardStep: React.FC<ReportCardStepProps> = ({
 26 |   report,
 27 |   onFinish,
 28 |   onPrevious,
 29 | }) => {
 30 |   const cards = useMemo(() => {
 31 |     if (!report) return null;
 32 |     const cards = [];
 33 | 
 34 |     // Iterate through selected eval functions and create cards
 35 |     for (const selectedFunc of report.selectedEvalFunctions) {
 36 |       const c = selectedFunc.evalCriteria;
 37 |       // Find corresponding report in allEvalFunctionReports map from criteria to list
 38 |       const evalFuncReports = report.allEvalFunctionReports.get(c);
 39 |       const evalFuncReport = evalFuncReports?.find(
 40 |         (rep) => rep.evalFunction === selectedFunc,
 41 |       );
 42 |       // Get the functions that were not selected for this criteria
 43 |       const otherFuncs = evalFuncReports?.filter(
 44 |         (rep) => rep.evalFunction !== selectedFunc,
 45 |       );
 46 | 
 47 |       cards.push(
 48 |         <CriteriaCard
 49 |           reportMode
 50 |           title={c.shortname}
 51 |           description={c.criteria}
 52 |           evalMethod={c.eval_method}
 53 |           key={c.uid}
 54 |           evalFuncReport={evalFuncReport}
 55 |           otherFuncs={otherFuncs}
 56 |         />,
 57 |       );
 58 |     }
 59 |     return cards;
 60 |   }, [report]);
 61 | 
 62 |   return (
 63 |     <Stack spacing="lg">
 64 |       <Text align="center" size="lg" pl="sm" mb="lg">
 65 |         Chosen Functions and Alignment
 66 |       </Text>
 67 | 
 68 |       {/* Show coverage and false failure rate numbers */}
 69 |       <Flex justify="center" gap="md" mb="lg">
 70 |         <Group position="center" spacing="xl" style={{ textAlign: "center" }}>
 71 |           <Card
 72 |             shadow="sm"
 73 |             padding="md"
 74 |             radius="md"
 75 |             style={{ backgroundColor: "#f0f0f0" }}
 76 |           >
 77 |             <Text weight={500} size="md">
 78 |               Coverage of Bad Responses
 79 |             </Text>
 80 |             <Text color="blue" weight={700} size="md">
 81 |               {report?.failureCoverage.toFixed(2)}%
 82 |             </Text>
 83 |           </Card>
 84 |           <Card
 85 |             shadow="sm"
 86 |             padding="md"
 87 |             radius="md"
 88 |             style={{ backgroundColor: "#f0f0f0" }}
 89 |           >
 90 |             <Text weight={500} size="md">
 91 |               False Failure Rate
 92 |             </Text>
 93 |             <Text color="red" weight={700} size="md">
 94 |               {report?.falseFailureRate.toFixed(2)}%
 95 |             </Text>
 96 |           </Card>
 97 |         </Group>
 98 |       </Flex>
 99 | 
100 |       <ScrollArea mih={300} h={400} mah={400}>
101 |         <SimpleGrid cols={3} spacing="sm" verticalSpacing="sm" mb="lg">
102 |           {cards}
103 |         </SimpleGrid>
104 |       </ScrollArea>
105 | 
106 |       <Flex justify="center" gap={12} mt="xs">
107 |         <Button
108 |           onClick={() => {
109 |             if (!report) return;
110 |             onFinish(report);
111 |           }}
112 |         >
113 |           Finish with selected evaluators
114 |         </Button>
115 |       </Flex>
116 |     </Stack>
117 |   );
118 | };
119 | 
120 | export default ReportCardStep;
121 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/EvalGen/WelcomeStep.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import { Anchor, Button, List, Stack, Text, Title } from "@mantine/core";
 3 | 
 4 | interface WelcomeStepProps {
 5 |   setOnNextCallback: React.Dispatch<React.SetStateAction<() => unknown>>;
 6 | }
 7 | 
 8 | /**
 9 |  * Static intro page of the EvalGen wizard: explains what EvalGen does and its beta limits.
10 |  */
11 | const WelcomeStep: React.FC<WelcomeStepProps> = ({ setOnNextCallback }) => (
12 |   <Stack spacing="md" m="lg" p="lg" mb={120}>
13 |     <Title order={2}>Welcome to the EvalGen Wizard</Title>
14 |     <Text>
15 |       This wizard will guide you through creating automated evaluators for LLM
16 |       responses that are aligned with your preferences. You&apos;ll look at
17 |       data, define what you care about, apply those criteria to grade data, and
18 |       refine your criteria as you see more outputs. EvalGen then generates
19 |       automated evaluators that implement each criteria, chooses implementations
20 |       most aligned with your grades, and reports how aligned they are.
21 |     </Text>
22 |     <Text>
23 |       EvalGen is backed up by our{" "}
24 |       <Anchor
25 |         href="https://dl.acm.org/doi/abs/10.1145/3654777.3676450"
26 |         target="_blank"
27 |       >
28 |         empirical research at UIST 2024
29 |       </Anchor>
30 |       , and is inspired by inductive processes in UX research (heuristic
31 |       evaluation and grounded theory).
32 |     </Text>
33 |     <Text>Currently, EvalGen is in a public beta. It:</Text>
34 |     <List>
35 |       <List.Item>
36 |         Only generates <b>assertions (pass/fail tests)</b>. Numeric and
37 |         categorical evaluators are not included.
38 |       </List.Item>
39 |       <List.Item>
40 |         Asks for grades on a <b>per-criteria</b> basis on the main grading
41 |         screen. This is the chief difference from our paper.
42 |       </List.Item>
43 |       <List.Item>
44 |         Requires access to the GenAI features of ChainForge, which (currently)
45 |         requires an OpenAI API key. (If you&apos;d like to use other models,
46 |         more general access to GenAI features is coming soon.)
47 |       </List.Item>
48 |       <List.Item>
49 |         Should be run on the outputs of <b>already-run</b> Prompt Nodes
50 |         (you&apos;ve already collected some LLM responses).
51 |       </List.Item>
52 |       <List.Item>EvalGen will send off many requests during usage.</List.Item>
53 |     </List>
54 |     <Text>
55 |       🔔 <b>By using EvalGen, you take full responsibility for credit usage.</b>{" "}
56 |       Currently, EvalGen does NOT:
57 |     </Text>
58 |     <List>
59 |       <List.Item>
60 |         Work on imported spreadsheets of data (although if you are interested in
61 |         this, raise a Pull Request).
62 |       </List.Item>
63 |       <List.Item>
64 |         Generate code that uses third-party libraries. For safety, LLM-generated
65 |         Python code is run sandboxed in the browser with pyodide. Pyodide does
66 |         not have access to many libraries out-of-the-box. (If your eval criteria
67 |         implementation must use a third-party library, we suggest you use
68 |         ChainForge&apos;s genAI features on an individual code eval node,
69 |         outside this wizard.)
70 |       </List.Item>
71 |     </List>
72 |     {/* TODO: optionally list "We have captured the following about your context:" here,
73 |         with an opt-in "[x] Use this info when helping me think of evaluation criteria". */}
74 |     <Text>
75 |       After EvalGen finishes, the chosen evaluators appear in the MultiEval
76 |       node.
77 |     </Text>
78 |     <Text>
79 |       EvalGen is in beta. To improve it, provide feedback on our GitHub Issues
80 |       or Discussion pages, or raise a Pull Request with the changes.
81 |     </Text>
82 |   </Stack>
83 | );
84 | 
85 | export default WelcomeStep;
86 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/ImagePreviewModal.tsx:
--------------------------------------------------------------------------------
  1 | import React, {
  2 |   forwardRef,
  3 |   useImperativeHandle,
  4 |   useState,
  5 |   useEffect,
  6 | } from "react";
  7 | import { Modal, Image, Text, Stack } from "@mantine/core";
  8 | import { Dict } from "./backend/typing";
  9 | import { metadataRowType } from "./MediaNode";
 10 | 
 11 | /** Imperative handle a parent obtains through `ref`. */
 12 | export interface ImagePreviewModalRef {
 13 |   /** Stores `url` and `data` as the current image and opens the modal. */
 14 |   trigger: (url: string, data: metadataRowType) => void;
 15 | }
 16 | 
 17 | interface ImagePreviewModalProps {
 18 |   /** Modal title; defaults to "Image Details Info". */
 19 |   title?: string;
 20 | }
 21 | 
 22 | /** Details listed underneath the previewed image. */
 23 | interface ImageInfo {
 24 |   user_source: string;
 25 |   width: number;
 26 |   height: number;
 27 |   format: string;
 28 |   size: string;
 29 |   timestamp: string;
 30 |   token_count?: Dict<string>;
 31 | }
 32 | 
 33 | /**
 34 |  * Modal showing an image plus a few facts about it. It opens only through
 35 |  * the `trigger` method on its ref. Width and height are measured by loading
 36 |  * the URL into a detached <img>; the other fields are copied from the
 37 |  * metadata row passed to `trigger`.
 38 |  */
 39 | const ImagePreviewModal = forwardRef<
 40 |   ImagePreviewModalRef,
 41 |   ImagePreviewModalProps
 42 | >(({ title = "Image Details Info" }, ref) => {
 43 |   const [opened, setOpened] = useState(false);
 44 |   const [imageUrl, setImageUrl] = useState("");
 45 |   const [imageData, setImageData] = useState<metadataRowType>(
 46 |     {} as metadataRowType,
 47 |   );
 48 |   const [imageInfo, setImageInfo] = useState<ImageInfo | null>(null);
 49 | 
 50 |   // Only state setters are used, so the handle never needs rebuilding.
 51 |   useImperativeHandle(
 52 |     ref,
 53 |     () => ({
 54 |       trigger: (url: string, data: metadataRowType) => {
 55 |         setImageUrl(url);
 56 |         setImageData(data);
 57 |         setOpened(true);
 58 |       },
 59 |     }),
 60 |     [],
 61 |   );
 62 | 
 63 |   useEffect(() => {
 64 |     if (!imageUrl) return undefined;
 65 | 
 66 |     // Set by the cleanup so a slow load of a previous image cannot
 67 |     // overwrite the info of the image that is shown now.
 68 |     let superseded = false;
 69 |     const img = document.createElement("img");
 70 |     img.onload = () => {
 71 |       if (superseded) return;
 72 |       // The timestamp is treated as seconds; Date expects milliseconds.
 73 |       const seconds = parseInt(imageData?.timestamp, 10);
 74 |       setImageInfo({
 75 |         user_source: imageData?.source,
 76 |         width: img.naturalWidth,
 77 |         height: img.naturalHeight,
 78 |         format: imageData?.coming_from,
 79 |         size: imageData?.size,
 80 |         timestamp: Number.isNaN(seconds)
 81 |           ? "Unknown"
 82 |           : new Date(seconds * 1000).toString(),
 83 |       });
 84 |     };
 85 |     img.onerror = () => {
 86 |       // Do not keep showing details that belong to an earlier image.
 87 |       if (!superseded) setImageInfo(null);
 88 |     };
 89 |     img.src = imageUrl;
 90 | 
 91 |     return () => {
 92 |       superseded = true;
 93 |     };
 94 |   }, [imageUrl, imageData]);
 95 | 
 96 |   return (
 97 |     <Modal
 98 |       opened={opened}
 99 |       onClose={() => setOpened(false)}
100 |       title={title}
101 |       size="xl"
102 |     >
103 |       <Stack spacing="md" align="center">
104 |         <div
105 |           style={{
106 |             width: "100%",
107 |             overflow: "hidden",
108 |             display: "flex",
109 |             alignItems: "center",
110 |             justifyContent: "center",
111 |           }}
112 |         >
113 |           <Image
114 |             src={imageUrl}
115 |             alt="Image preview"
116 |             fit="contain"
117 |             style={{
118 |               maxWidth: "100%",
119 |               maxHeight: "100%",
120 |               objectFit: "contain",
121 |             }}
122 |           />
123 |         </div>
124 |         {imageInfo && (
125 |           <div
126 |             style={{
127 |               width: "100%",
128 |               padding: "10px",
129 |               borderRadius: "8px",
130 |               border: "1px solid #e9ecef",
131 |             }}
132 |           >
133 |             <Text size="sm" style={{ lineHeight: 1.7 }}>
134 |               <strong>Format:</strong> {imageInfo.format}
135 |               <br />
136 |               <strong>Timestamp:</strong> {imageInfo.timestamp}
137 |               <br />
138 |               <strong>Source:</strong> {imageInfo.user_source}
139 |               <br />
140 |               <hr style={{ margin: "10px 0" }} />
141 |               <strong>Width:</strong> {imageInfo.width} px
142 |               <br />
143 |               <strong>Height:</strong> {imageInfo.height} px
144 |               <br />
145 |               <strong>Size:</strong> {imageInfo.size} bytes
146 |               <br />
147 |               {/* TODO: Token Count: 'TODO Feature coming' */}
148 |             </Text>
149 |           </div>
150 |         )}
151 |       </Stack>
152 |     </Modal>
153 |   );
154 | });
155 | 
156 | ImagePreviewModal.displayName = "ImagePreviewModal";
157 | 
158 | export default ImagePreviewModal;
159 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/InspectFooter.tsx:
--------------------------------------------------------------------------------
  1 | import React, { useMemo } from "react";
  2 | import { Button, Tooltip } from "@mantine/core";
  3 | import {
  4 |   IconSearch,
  5 |   IconSquareArrowLeft,
  6 |   IconSquareArrowRight,
  7 | } from "@tabler/icons-react";
  8 | 
  9 | /** Props accepted by InspectFooter. */
 10 | export interface InspectFooterProps {
 11 |   onClick: () => void;
 12 |   showDrawerButton: boolean;
 13 |   onDrawerClick: () => void;
 14 |   isDrawerOpen: boolean;
 15 |   showNotificationDot?: boolean;
 16 |   label?: React.ReactNode;
 17 | }
 18 | 
 19 | /**
 20 |  * Footer strip at the bottom of a node. The main button calls `onClick`
 21 |  * (tooltip: "Open fullscreen inspector"); when `showDrawerButton` is set, a
 22 |  * narrow second button calls `onDrawerClick` to toggle the inspector drawer.
 23 |  */
 24 | const InspectFooter: React.FC<InspectFooterProps> = (props) => {
 25 |   const {
 26 |     label,
 27 |     onClick,
 28 |     showDrawerButton,
 29 |     onDrawerClick,
 30 |     isDrawerOpen,
 31 |     showNotificationDot,
 32 |   } = props;
 33 | 
 34 |   // Caller-supplied label, or the default "Inspect responses" caption.
 35 |   const buttonContent = useMemo(() => {
 36 |     if (label !== undefined && label !== null) return label;
 37 |     return (
 38 |       <>
 39 |         Inspect responses&nbsp;
 40 |         <IconSearch size="12pt" />
 41 |       </>
 42 |     );
 43 |   }, [label]);
 44 | 
 45 |   // The two buttons share the row: 84% + 16% when the drawer button shows.
 46 |   const mainButtonWidth = showDrawerButton ? "84%" : "100%";
 47 | 
 48 |   const drawerToggle = useMemo(() => {
 49 |     if (!showDrawerButton) return undefined;
 50 | 
 51 |     const tooltipText = `${isDrawerOpen ? "Close" : "Open"} inspector drawer`;
 52 |     const ArrowIcon = isDrawerOpen ? IconSquareArrowLeft : IconSquareArrowRight;
 53 |     return (
 54 |       <Tooltip label={tooltipText} position="bottom" withArrow withinPortal>
 55 |         <Button
 56 |           color="blue"
 57 |           variant="subtle"
 58 |           w="16%"
 59 |           p="0px"
 60 |           onClick={onDrawerClick}
 61 |           style={{
 62 |             borderRadius: "0px",
 63 |             borderLeft: "1px solid #bdf",
 64 |             cursor: "pointer",
 65 |           }}
 66 |         >
 67 |           <ArrowIcon size="12pt" style={{ flexShrink: "0" }} />
 68 |         </Button>
 69 |       </Tooltip>
 70 |     );
 71 |   }, [showDrawerButton, onDrawerClick, isDrawerOpen]);
 72 | 
 73 |   // Small marker shown inside the main button when something changed.
 74 |   const notificationDot = showNotificationDot ? (
 75 |     <div className="something-changed-circle"></div>
 76 |   ) : (
 77 |     <></>
 78 |   );
 79 | 
 80 |   return (
 81 |     <div
 82 |       className="eval-inspect-response-footer nodrag"
 83 |       style={{ display: "flex", justifyContent: "center" }}
 84 |     >
 85 |       <Tooltip
 86 |         label="Open fullscreen inspector"
 87 |         position="bottom"
 88 |         withArrow
 89 |         withinPortal
 90 |       >
 91 |         <Button
 92 |           color="blue"
 93 |           variant="subtle"
 94 |           w={mainButtonWidth}
 95 |           onClick={onClick}
 96 |         >
 97 |           {buttonContent}
 98 |           {notificationDot}
 99 |         </Button>
100 |       </Tooltip>
101 |       {drawerToggle}
102 |     </div>
103 |   );
104 | };
105 | 
106 | export default InspectFooter;
107 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/InspectorNode.tsx:
--------------------------------------------------------------------------------
  1 | import React, { useState, useEffect, useContext } from "react";
  2 | import { Handle, Position } from "reactflow";
  3 | import useStore from "./store";
  4 | import BaseNode from "./BaseNode";
  5 | import NodeLabel from "./NodeLabelComponent";
  6 | import LLMResponseInspector, { exportToExcel } from "./LLMResponseInspector";
  7 | import { grabResponses } from "./backend/backend";
  8 | import { LLMResponse } from "./backend/typing";
  9 | import { AlertModalContext } from "./AlertModal";
 10 | 
 11 | export interface InspectorNodeProps {
 12 |   data: {
 13 |     title: string;
 14 |     input: string;
 15 |     refresh: boolean;
 16 |   };
 17 |   id: string;
 18 | }
 19 | 
 20 | /**
 21 |  * Node that shows the LLM responses of whatever nodes are wired into its
 22 |  * "input" handle. Responses are (re)loaded when `data.input` changes, when
 23 |  * `data.refresh` is set, and when the handle reports a new connection.
 24 |  */
 25 | const InspectorNode: React.FC<InspectorNodeProps> = ({ data, id }) => {
 26 |   const [jsonResponses, setJSONResponses] = useState<LLMResponse[] | null>(
 27 |     null,
 28 |   );
 29 | 
 30 |   const inputEdgesForNode = useStore((state) => state.inputEdgesForNode);
 31 |   const setDataPropsForNode = useStore((state) => state.setDataPropsForNode);
 32 |   const showAlert = useContext(AlertModalContext);
 33 | 
 34 |   // Fetch bookkeeping lives in a ref: a plain `let` in the component body is
 35 |   // re-created on every render and therefore cannot remember that a request
 36 |   // started by an earlier render is still running.
 37 |   const fetchState = React.useRef({ inFlight: false, rerunRequested: false });
 38 | 
 39 |   const handleOnConnect = React.useCallback(() => {
 40 |     const state = fetchState.current;
 41 | 
 42 |     // 'on connect' can fire twice for one connection. While a request is
 43 |     // running, remember that another one was asked for instead of starting
 44 |     // it in parallel; this also keeps an older reply from landing last.
 45 |     if (state.inFlight) {
 46 |       state.rerunRequested = true;
 47 |       return;
 48 |     }
 49 | 
 50 |     const fetchOnce = () => {
 51 |       // Get the ids from the connected input nodes:
 52 |       const input_node_ids = inputEdgesForNode(id).map((e) => e.source);
 53 | 
 54 |       state.inFlight = true;
 55 |       state.rerunRequested = false;
 56 | 
 57 |       const finish = () => {
 58 |         state.inFlight = false;
 59 |         // Something changed while we were busy: fetch once more so the
 60 |         // view ends up with the latest inputs.
 61 |         if (state.rerunRequested) fetchOnce();
 62 |       };
 63 | 
 64 |       // Grab responses associated with those ids:
 65 |       grabResponses(input_node_ids)
 66 |         .then((resps) => {
 67 |           // An empty result leaves the currently shown responses in place.
 68 |           if (resps && resps.length > 0) setJSONResponses(resps);
 69 |           finish();
 70 |         })
 71 |         // Best effort, as before: a failed fetch keeps the old responses.
 72 |         .catch(finish);
 73 |     };
 74 | 
 75 |     fetchOnce();
 76 |   }, [id, inputEdgesForNode]);
 77 | 
 78 |   // Reload when the inputs change. Done in an effect so that rendering
 79 |   // itself stays free of side effects.
 80 |   useEffect(() => {
 81 |     if (data.input) handleOnConnect();
 82 |   }, [data.input, handleOnConnect]);
 83 | 
 84 |   useEffect(() => {
 85 |     if (data.refresh === true) {
 86 |       // Clear the flag first, then recreate the visualization:
 87 |       setDataPropsForNode(id, { refresh: false });
 88 |       handleOnConnect();
 89 |     }
 90 |   }, [data.refresh, id, handleOnConnect, setDataPropsForNode]);
 91 | 
 92 |   return (
 93 |     <BaseNode classNames="inspector-node" nodeId={id}>
 94 |       <NodeLabel
 95 |         title={data.title || "Inspect Node"}
 96 |         nodeId={id}
 97 |         icon={"🔍"}
 98 |         customButtons={[
 99 |           <button
100 |             className="custom-button"
101 |             key="export-data"
102 |             onClick={() => {
103 |               try {
104 |                 exportToExcel(jsonResponses ?? []);
105 |               } catch (e) {
106 |                 showAlert && showAlert(e as Error);
107 |               }
108 |             }}
109 |           >
110 |             Export data
111 |           </button>,
112 |         ]}
113 |       />
114 |       <div
115 |         className="inspect-response-container nowheel nodrag"
116 |         style={{ marginTop: "-8pt" }}
117 |       >
118 |         <LLMResponseInspector
119 |           jsonResponses={jsonResponses ?? []}
120 |           isOpen={true}
121 |           wideFormat={false}
122 |         />
123 |       </div>
124 |       <Handle
125 |         type="target"
126 |         position={Position.Left}
127 |         id="input"
128 |         className="grouped-handle"
129 |         style={{ top: "50%" }}
130 |         onConnect={handleOnConnect}
131 |       />
132 |     </BaseNode>
133 |   );
134 | };
135 | 
136 | export default InspectorNode;
137 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/LLMItemButtonGroup.tsx:
--------------------------------------------------------------------------------
 1 | import React, { Button, Group, RingProgress } from "@mantine/core";
 2 | import { IconSettings, IconTrash } from "@tabler/icons-react";
 3 | import { QueryProgress } from "./backend/typing";
 4 | 
 5 | /**
 6 |  * Tiny progress indicator for a running query. Renders nothing without
 7 |  * progress info, a spinner while neither successes nor errors have been
 8 |  * reported, and otherwise a ring with a success and an error section.
 9 |  */
10 | export function GatheringResponsesRingProgress({
11 |   progress,
12 | }: {
13 |   progress: QueryProgress | undefined;
14 | }) {
15 |   if (progress === undefined) return <></>;
16 | 
17 |   const nothingReported = !(progress.success > 0 || progress.error > 0);
18 |   if (nothingReported)
19 |     return (
20 |       <div className="lds-ring">
21 |         <div></div>
22 |         <div></div>
23 |         <div></div>
24 |         <div></div>
25 |       </div>
26 |     );
27 | 
28 |   const successColor = progress.success < 99 ? "blue" : "green";
29 |   const ringSections = [
30 |     { value: progress.success, color: successColor },
31 |     { value: progress.error, color: "red" },
32 |   ];
33 |   return <RingProgress size={20} thickness={3} sections={ringSections} />;
34 | }
35 | 
36 | /** Props accepted by LLMItemButtonGroup. */
37 | export interface LLMItemButtonGroupProps {
38 |   onClickTrash?: () => void;
39 |   onClickSettings?: () => void;
40 |   ringProgress?: QueryProgress;
41 |   hideTrashIcon?: boolean;
42 | }
43 | 
44 | /**
45 |  * Right-aligned controls for one LLM list item: the gathering-progress
46 |  * indicator, a trash button (unless `hideTrashIcon` is set) and a
47 |  * settings button.
48 |  */
49 | export default function LLMItemButtonGroup(props: LLMItemButtonGroupProps) {
50 |   const { onClickTrash, onClickSettings, ringProgress, hideTrashIcon } = props;
51 | 
52 |   // An empty fragment stands in for the trash button when it is hidden.
53 |   let trashButton = <></>;
54 |   if (!hideTrashIcon) {
55 |     trashButton = (
56 |       <Button
57 |         onClick={onClickTrash}
58 |         size="xs"
59 |         variant="light"
60 |         compact
61 |         color="red"
62 |         style={{ padding: "0px" }}
63 |       >
64 |         <IconTrash size={"95%"} />
65 |       </Button>
66 |     );
67 |   }
68 | 
69 |   const settingsButton = (
70 |     <Button
71 |       onClick={onClickSettings}
72 |       size="xs"
73 |       variant="light"
74 |       color="blue"
75 |       compact
76 |     >
77 |       <IconSettings size={"110%"} />
78 |     </Button>
79 |   );
80 | 
81 |   return (
82 |     <div>
83 |       <Group
84 |         position="right"
85 |         spacing="xs"
86 |         style={{ float: "right", height: "20px" }}
87 |       >
88 |         <GatheringResponsesRingProgress progress={ringProgress} />
89 |         {trashButton}
90 |         {settingsButton}
91 |       </Group>
92 |     </div>
93 |   );
94 | }
95 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/LLMResponseInspectorDrawer.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import LLMResponseInspector from "./LLMResponseInspector";
 3 | import { LLMResponse } from "./backend/typing";
 4 | 
 5 | /** Props accepted by LLMResponseInspectorDrawer. */
 6 | export interface LLMResponseInspectorDrawerProps {
 7 |   jsonResponses: LLMResponse[];
 8 |   showDrawer: boolean;
 9 | }
10 | 
11 | /**
12 |  * Wraps the response inspector in the drawer container. The inspector
13 |  * stays mounted at all times; `showDrawer` only switches the wrapper's
14 |  * CSS `display` and is forwarded to the inspector as `isOpen`.
15 |  */
16 | export default function LLMResponseInspectorDrawer(
17 |   props: LLMResponseInspectorDrawerProps,
18 | ) {
19 |   const { jsonResponses, showDrawer } = props;
20 |   const drawerDisplay = showDrawer ? "initial" : "none";
21 | 
22 |   const inspector = (
23 |     <LLMResponseInspector
24 |       jsonResponses={jsonResponses}
25 |       isOpen={showDrawer}
26 |       wideFormat={false}
27 |     />
28 |   );
29 | 
30 |   return (
31 |     <div className="inspect-responses-drawer" style={{ display: drawerDisplay }}>
32 |       <div
33 |         className="inspect-response-container nowheel nodrag"
34 |         style={{ margin: "0px 10px 10px 12px" }}
35 |       >
36 |         {inspector}
37 |       </div>
38 |     </div>
39 |   );
40 | }
41 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/LLMResponseInspectorModal.tsx:
--------------------------------------------------------------------------------
  1 | /**
  2 |  * A fullscreen version of the Inspect node that
  3 |  * appears in a Mantine modal pop-up which takes up much of the screen.
  4 |  */
  5 | import React, {
  6 |   forwardRef,
  7 |   useImperativeHandle,
  8 |   lazy,
  9 |   Suspense,
 10 |   useContext,
 11 | } from "react";
 12 | import { LoadingOverlay, Modal } from "@mantine/core";
 13 | import { useDisclosure } from "@mantine/hooks";
 14 | import { exportToExcel } from "./LLMResponseInspector";
 15 | import { LLMResponse } from "./backend/typing";
 16 | import { AlertModalContext } from "./AlertModal";
 17 | 
 18 | // The inspector view is loaded on demand; a Suspense fallback covers the wait.
 19 | const LLMResponseInspector = lazy(() => import("./LLMResponseInspector"));
 20 | 
 21 | /** Imperative handle a parent obtains through `ref`. */
 22 | export interface LLMResponseInspectorModalRef {
 23 |   /** Opens the modal. */
 24 |   trigger: () => void;
 25 | }
 26 | 
 27 | /** Props; everything except the ref is passed on to the inspector. */
 28 | export interface LLMResponseInspectorModalProps {
 29 |   jsonResponses: LLMResponse[];
 30 |   customLLMFieldName?: string;
 31 |   disableBackgroundColor?: boolean;
 32 |   treatLLMFieldAsUnique?: boolean;
 33 | }
 34 | 
 35 | const LLMResponseInspectorModal = forwardRef<
 36 |   LLMResponseInspectorModalRef,
 37 |   LLMResponseInspectorModalProps
 38 | >(function LLMResponseInspectorModal(props, ref) {
 39 |   const {
 40 |     jsonResponses,
 41 |     customLLMFieldName,
 42 |     disableBackgroundColor,
 43 |     treatLLMFieldAsUnique,
 44 |   } = props;
 45 |   const [opened, { open, close }] = useDisclosure(false);
 46 |   const showAlert = useContext(AlertModalContext);
 47 | 
 48 |   // This gives the parent access to triggering the modal
 49 |   useImperativeHandle(ref, () => ({
 50 |     trigger: () => {
 51 |       open();
 52 |     },
 53 |   }));
 54 | 
 55 |   // Export the responses; on failure close the modal and show the error.
 56 |   const handleExportClick = () => {
 57 |     try {
 58 |       exportToExcel(jsonResponses);
 59 |     } catch (e) {
 60 |       close();
 61 |       showAlert && showAlert(e as Error);
 62 |     }
 63 |   };
 64 | 
 65 |   // The header ignores pointer events (see `styles` below), so the export
 66 |   // button has to switch them back on for itself.
 67 |   const exportHeader = (
 68 |     <div>
 69 |       <button
 70 |         className="custom-button"
 71 |         style={{
 72 |           marginTop: "auto",
 73 |           marginRight: "14px",
 74 |           float: "right",
 75 |           pointerEvents: "all",
 76 |         }}
 77 |         onClick={handleExportClick}
 78 |       >
 79 |         Export data to Excel
 80 |       </button>
 81 |     </div>
 82 |   );
 83 | 
 84 |   return (
 85 |     <Modal
 86 |       size="100%"
 87 |       keepMounted
 88 |       opened={opened}
 89 |       onClose={close}
 90 |       closeOnClickOutside={true}
 91 |       title={exportHeader}
 92 |       styles={{
 93 |         title: {
 94 |           justifyContent: "space-between",
 95 |           width: "100%",
 96 |           padding: "0px",
 97 |         },
 98 |         header: {
 99 |           paddingBottom: "0px",
100 |           paddingTop: "12px",
101 |           marginBottom: "-24px",
102 |           backgroundColor: "transparent",
103 |           pointerEvents: "none",
104 |         },
105 |         close: { pointerEvents: "all" },
106 |       }}
107 |     >
108 |       <div
109 |         className="inspect-modal-response-container"
110 |         style={{ padding: "0px", overflow: "scroll" }}
111 |       >
112 |         <Suspense fallback={<LoadingOverlay visible={true} />}>
113 |           <LLMResponseInspector
114 |             jsonResponses={jsonResponses}
115 |             isOpen={opened}
116 |             wideFormat={true}
117 |             customLLMFieldName={customLLMFieldName}
118 |             disableBackgroundColor={disableBackgroundColor}
119 |             treatLLMFieldAsUnique={treatLLMFieldAsUnique}
120 |           />
121 |         </Suspense>
122 |       </div>
123 |     </Modal>
124 |   );
125 | });
126 | 
127 | export default LLMResponseInspectorModal;
128 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/PlotLegend.tsx:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import { Dict } from "./backend/typing";
 3 | import { truncStr } from "./backend/utils";
 4 | 
 5 | /** Props accepted by PlotLegend. */
 6 | export interface PlotLegendProps {
 7 |   /** Maps each legend label to the color of its swatch. */
 8 |   labels: Dict<string>;
 9 |   /** Called with the full (untruncated) label when an entry is clicked. */
10 |   onClickLabel: (label: string) => void;
11 | }
12 | 
13 | /**
14 |  * Clickable legend: one row per entry of `labels`, made of a 10px color
15 |  * swatch and the label text passed through `truncStr(label, 56)`.
16 |  */
17 | const PlotLegend: React.FC<PlotLegendProps> = ({ labels, onClickLabel }) => {
18 |   const rows = Object.keys(labels).map((label) => {
19 |     const swatchColor = labels[label];
20 |     const caption = truncStr(label, 56);
21 |     return (
22 |       <div
23 |         key={label}
24 |         className="plot-legend-item nodrag"
25 |         onClick={() => onClickLabel(label)}
26 |       >
27 |         <span
28 |           style={{
29 |             backgroundColor: swatchColor,
30 |             width: "10px",
31 |             height: "10px",
32 |             display: "inline-block",
33 |           }}
34 |         ></span>
35 |         <span style={{ marginLeft: "5px" }}>{caption}</span>
36 |       </div>
37 |     );
38 |   });
39 | 
40 |   return <div className="plot-legend">{rows}</div>;
41 | };
42 | 
43 | export default PlotLegend;
44 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/RemoveEdge.tsx:
--------------------------------------------------------------------------------
  1 | import React, { useState } from "react";
  2 | import styled from "styled-components";
  3 | import { BaseEdge, EdgeLabelRenderer, getBezierPath } from "@reactflow/core";
  4 | import useStore from "./store";
  5 | import { Position } from "reactflow";
  6 | import { Dict } from "./backend/typing";
  7 | import { useMantineColorScheme } from "@mantine/core";
  8 | 
  9 | // SVG group around the edge; styles the edge path and its hover color.
 10 | const EdgePathContainer = styled.g`
 11 |   path {
 12 |     stroke: #999;
 13 |     transition: stroke 0.2s;
 14 |     pointer-events: all;
 15 |     &:hover {
 16 |       stroke: #000;
 17 |     }
 18 |   }
 19 | `;
 20 | 
 21 | /** Props received by the custom edge component. */
 22 | export interface CustomEdgeProps {
 23 |   id: string;
 24 |   sourceX: number;
 25 |   sourceY: number;
 26 |   targetX: number;
 27 |   targetY: number;
 28 |   sourcePosition: Position;
 29 |   targetPosition: Position;
 30 |   style: Dict;
 31 |   markerEnd?: string;
 32 | }
 33 | 
 34 | /**
 35 |  * Bezier edge that reveals a "×" button at the path's label position while
 36 |  * the pointer is over it; clicking the button removes the edge from the
 37 |  * store.
 38 |  */
 39 | export default function CustomEdge({
 40 |   id,
 41 |   sourceX,
 42 |   sourceY,
 43 |   targetX,
 44 |   targetY,
 45 |   sourcePosition,
 46 |   targetPosition,
 47 |   style = {},
 48 |   markerEnd,
 49 | }: CustomEdgeProps) {
 50 |   const [hovering, setHovering] = useState(false);
 51 |   const removeEdge = useStore((state) => state.removeEdge);
 52 | 
 53 |   // Color theme
 54 |   const { colorScheme } = useMantineColorScheme();
 55 | 
 56 |   const [edgePath, labelX, labelY] = getBezierPath({
 57 |     sourceX,
 58 |     sourceY,
 59 |     sourcePosition,
 60 |     targetX,
 61 |     targetY,
 62 |     targetPosition,
 63 |   });
 64 | 
 65 |   // Grey at rest; while hovered, black on the light theme, near-white
 66 |   // otherwise.
 67 |   let strokeColor = "#999";
 68 |   if (hovering) strokeColor = colorScheme === "light" ? "#000" : "#eee";
 69 | 
 70 |   // Stop the click from propagating further, then drop the edge.
 71 |   const handleRemoveClick = (evt: React.MouseEvent<HTMLButtonElement>) => {
 72 |     evt.stopPropagation();
 73 |     removeEdge(id);
 74 |   };
 75 | 
 76 |   const buttonWrapperStyle: React.CSSProperties = {
 77 |     position: "absolute",
 78 |     transform: `translate(-50%, -50%) translate(${labelX}px,${labelY}px)`,
 79 |     fontSize: 12,
 80 |     pointerEvents: "all",
 81 |     visibility: hovering ? "inherit" : "hidden",
 82 |   };
 83 | 
 84 |   // Thanks in part to oshanley https://github.com/wbkd/react-flow/issues/1211#issuecomment-1585032930
 85 |   return (
 86 |     <EdgePathContainer
 87 |       onPointerEnter={() => setHovering(true)}
 88 |       onPointerLeave={() => setHovering(false)}
 89 |     >
 90 |       <BaseEdge
 91 |         path={edgePath}
 92 |         markerEnd={markerEnd}
 93 |         style={{ ...style, stroke: strokeColor }}
 94 |       />
 95 |       <EdgeLabelRenderer>
 96 |         <div style={buttonWrapperStyle} className="nodrag nopan">
 97 |           <button className="remove-edge-btn" onClick={handleRemoveClick}>
 98 |             ×
 99 |           </button>
100 |         </div>
101 |       </EdgeLabelRenderer>
102 |     </EdgePathContainer>
103 |   );
104 | }
105 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/RenameValueModal.tsx:
--------------------------------------------------------------------------------
 1 | import React, { forwardRef, useEffect, useImperativeHandle } from "react";
 2 | import { Modal, TextInput, Button, Box, Group } from "@mantine/core";
 3 | import { useForm } from "@mantine/form";
 4 | import { useDisclosure } from "@mantine/hooks";
 5 | 
 6 | /** Props accepted by RenameValueModal. */
 7 | export interface RenameValueModalProps {
 8 |   initialValue: string;
 9 |   title: string;
10 |   label: string;
11 |   onSubmit?: (val: string) => void;
12 | }
13 | 
14 | /** Imperative handle a parent obtains through `ref`. */
15 | export interface RenameValueModalRef {
16 |   trigger: (msg?: string) => void;
17 | }
18 | 
19 | // Rejects values that are empty once surrounding whitespace is removed.
20 | const validateNewValue = (v: string) => {
21 |   if (v.trim().length > 0) return null;
22 |   return "Column names must have at least one character";
23 | };
24 | 
25 | /**
26 |  * Modal with a single TextInput for renaming one value. It is opened via
27 |  * the ref's `trigger`; a valid submit calls `onSubmit` (when given) with
28 |  * the entered text and then closes the modal.
29 |  */
30 | const RenameValueModal = forwardRef<RenameValueModalRef, RenameValueModalProps>(
31 |   function RenameValueModal(props, ref) {
32 |     const { initialValue, title, label, onSubmit } = props;
33 |     const [opened, { open, close }] = useDisclosure(false);
34 |     const form = useForm({
35 |       initialValues: { value: initialValue },
36 |       validate: { value: validateNewValue },
37 |     });
38 | 
39 |     // Keep the field in step with the `initialValue` prop.
40 |     useEffect(() => {
41 |       form.setValues({ value: initialValue });
42 |     }, [initialValue]);
43 | 
44 |     // This gives the parent access to triggering the modal alert
45 |     useImperativeHandle(ref, () => ({
46 |       trigger: () => {
47 |         open();
48 |       },
49 |     }));
50 | 
51 |     // Runs only after validation passed.
52 |     const handleValidSubmit = form.onSubmit((values) => {
53 |       if (onSubmit) onSubmit(values.value);
54 |       close();
55 |     });
56 | 
57 |     return (
58 |       <Modal opened={opened} onClose={close} title={title}>
59 |         <Box maw={300} mx="auto">
60 |           <form onSubmit={handleValidSubmit}>
61 |             <TextInput
62 |               withAsterisk
63 |               label={label}
64 |               autoFocus={true}
65 |               {...form.getInputProps("value")}
66 |             />
67 | 
68 |             <Group position="right" mt="md">
69 |               <Button type="submit">Submit</Button>
70 |             </Group>
71 |           </form>
72 |         </Box>
73 |       </Modal>
74 |     );
75 |   },
76 | );
77 | 
78 | export default RenameValueModal;
79 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/RequestClarificationModal.tsx:
--------------------------------------------------------------------------------
 1 | import React, { useEffect } from "react";
 2 | import { Modal, Button, TextInput, Flex, Text } from "@mantine/core";
 3 | import { useForm } from "@mantine/form";
 4 | 
 5 | export interface RequestClarificationModalProps {
 6 |   opened: boolean;
 7 |   title: string;
 8 |   desc?: string;
 9 |   initialValue?: string;
10 |   question: string;
11 |   onSubmit: (answer: string | null) => void;
12 |   validator?: (value: string) => string | null;
13 | }
14 | 
15 | /**
16 |  * Requests clarification on a question before continuing. `onSubmit`
17 |  * receives the validated answer, or `null` when the user presses Cancel.
18 |  * Visibility is controlled entirely by the `opened` prop.
19 |  */
20 | const RequestClarificationModal: React.FC<RequestClarificationModalProps> = ({
21 |   opened,
22 |   initialValue,
23 |   title,
24 |   desc,
25 |   question,
26 |   onSubmit,
27 |   validator,
28 | }) => {
29 |   const form = useForm({
30 |     // Seeded from the prop so a reset falls back to the prefill rather than
31 |     // to an empty string.
32 |     initialValues: { answer: initialValue ?? "" },
33 |     validate: {
34 |       answer: (value: string) => {
35 |         if (value.trim().length === 0) return "You must provide an answer";
36 |         // An optional caller-supplied check runs after the non-empty check.
37 |         return validator ? validator(value) : null;
38 |       },
39 |     },
40 |   });
41 | 
42 |   // Re-seed the field every time the modal opens, and when `initialValue`
43 |   // changes while it is open. Syncing only on `initialValue` changes left
44 |   // the field empty or stale on a reopen with an unchanged prop, because
45 |   // Submit resets the form and Cancel keeps whatever was typed.
46 |   useEffect(() => {
47 |     if (opened) form.setFieldValue("answer", initialValue ?? "");
48 |   }, [opened, initialValue]);
49 | 
50 |   // Report the validated answer, then reset the form.
51 |   const handleSubmit = (values: typeof form.values) => {
52 |     onSubmit(values.answer);
53 |     form.reset();
54 |   };
55 | 
56 |   return (
57 |     <Modal
58 |       opened={opened}
59 |       onClose={() => {
60 |         form.reset();
61 |       }}
62 |       closeOnEscape={false}
63 |       withCloseButton={false}
64 |       title={title}
65 |       centered
66 |       style={{ position: "relative", left: "-4%" }}
67 |     >
68 |       <form onSubmit={form.onSubmit(handleSubmit)}>
69 |         <TextInput
70 |           label={question}
71 |           description={desc}
72 |           placeholder="Type your answer here"
73 |           {...form.getInputProps("answer")}
74 |         />
75 | 
76 |         <Flex justify="space-between" mt="md">
77 |           <Button
78 |             variant="light"
79 |             color="gray"
80 |             onClick={(e) => {
81 |               e.preventDefault();
82 |               onSubmit(null);
83 |             }}
84 |           >
85 |             Cancel
86 |           </Button>
87 |           <Button type="submit" color="green">
88 |             Submit
89 |           </Button>
90 |         </Flex>
91 |       </form>
92 |     </Modal>
93 |   );
94 | };
95 | 
96 | export default RequestClarificationModal;
97 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/ScriptNode.tsx:
--------------------------------------------------------------------------------
  1 | import React, { useState, useEffect, useCallback } from "react";
  2 | import useStore from "./store";
  3 | import BaseNode from "./BaseNode";
  4 | import NodeLabel from "./NodeLabelComponent";
  5 | import { IconSettingsAutomation } from "@tabler/icons-react";
  6 | import { Dict } from "./backend/typing";
  7 | 
  8 | export interface ScriptNodeProps {
  9 |   data: {
 10 |     scriptFiles: Dict<string>;
 11 |     title: string;
 12 |   };
 13 |   id: string;
 14 | }
 15 | 
 16 | /**
 17 |  * Node holding an editable list of text fields (folder paths of external
 18 |  * modules). The list is stored in the node's data as `scriptFiles`, a map
 19 |  * from a generated field id ("f0", "f1", ...) to the text of that field.
 20 |  */
 21 | const ScriptNode: React.FC<ScriptNodeProps> = ({ data, id }) => {
 22 |   const setDataPropsForNode = useStore((state) => state.setDataPropsForNode);
 23 |   const delButtonId = "del-";
 24 | 
 25 |   // Where the search for the next free field id starts. The counter begins
 26 |   // at 0 on every mount, while `data.scriptFiles` may already contain
 27 |   // "f0", "f1", ... (e.g. a node created earlier), so an id is only handed
 28 |   // out after checking that it is not taken. Without that check a new
 29 |   // field could silently overwrite an existing entry.
 30 |   const [idCounter, setIDCounter] = useState(0);
 31 |   const get_id = useCallback(
 32 |     (taken: Dict<string>) => {
 33 |       let n = idCounter;
 34 |       while ("f" + n.toString() in taken) n += 1;
 35 |       setIDCounter(n + 1);
 36 |       return "f" + n.toString();
 37 |     },
 38 |     [idCounter],
 39 |   );
 40 | 
 41 |   // Handle a change in a scripts' input.
 42 |   const handleInputChange = useCallback(
 43 |     (event: React.ChangeEvent<HTMLInputElement>) => {
 44 |       // The input's DOM id is the field id (see the render code below).
 45 |       const { id: fieldId, value } = event.currentTarget;
 46 |       setDataPropsForNode(id, {
 47 |         scriptFiles: { ...data.scriptFiles, [fieldId]: value },
 48 |       });
 49 |     },
 50 |     [data.scriptFiles, id, setDataPropsForNode],
 51 |   );
 52 | 
 53 |   // Handle delete script file.
 54 |   const handleDelete = useCallback(
 55 |     (event: React.MouseEvent<HTMLButtonElement>) => {
 56 |       // `currentTarget` is always the button the handler is attached to.
 57 |       const item_id = event.currentTarget.id.substring(delButtonId.length);
 58 |       const remaining = { ...data.scriptFiles };
 59 |       delete remaining[item_id];
 60 |       // Never leave the node without a field: re-add one empty field.
 61 |       if (Object.keys(remaining).length === 0) {
 62 |         remaining[get_id(remaining)] = "";
 63 |       }
 64 |       setDataPropsForNode(id, { scriptFiles: remaining });
 65 |     },
 66 |     [data.scriptFiles, id, setDataPropsForNode, get_id],
 67 |   );
 68 | 
 69 |   // Add a field
 70 |   const handleAddField = useCallback(() => {
 71 |     const current = { ...data.scriptFiles };
 72 |     current[get_id(current)] = "";
 73 |     setDataPropsForNode(id, { scriptFiles: current });
 74 |   }, [data.scriptFiles, id, setDataPropsForNode, get_id]);
 75 | 
 76 |   // Initialize fields (run once at init)
 77 |   useEffect(() => {
 78 |     if (!data.scriptFiles)
 79 |       setDataPropsForNode(id, { scriptFiles: { [get_id({})]: "" } });
 80 |   }, []);
 81 | 
 82 |   // Rendered straight from `data`, so the inputs always reflect the
 83 |   // current state without a copy of the JSX being kept in component state.
 84 |   const fieldIds = data.scriptFiles ? Object.keys(data.scriptFiles) : [];
 85 | 
 86 |   return (
 87 |     <BaseNode classNames="script-node" nodeId={id}>
 88 |       <NodeLabel
 89 |         title={data.title || "Global Python Scripts"}
 90 |         nodeId={id}
 91 |         editable={false}
 92 |         icon={<IconSettingsAutomation size="16px" />}
 93 |       />
 94 |       <label style={{ fontSize: "10pt" }}>
 95 |         Enter folder paths for external modules you wish to import.
 96 |       </label>{" "}
 97 |       <br />
 98 |       <br />
 99 |       <div>
100 |         {fieldIds.map((fieldId) => (
101 |           <div className="input-field nodrag" key={fieldId}>
102 |             <input
103 |               className="script-node-input"
104 |               type="text"
105 |               id={fieldId}
106 |               onChange={handleInputChange}
107 |               value={data.scriptFiles[fieldId]}
108 |             ></input>
109 |             <button
110 |               className="remove-text-field-btn nodrag"
111 |               id={delButtonId + fieldId}
112 |               onClick={handleDelete}
113 |             >
114 |               X
115 |             </button>
116 |             <br />
117 |           </div>
118 |         ))}
119 |       </div>
120 |       <div className="add-text-field-btn">
121 |         <button onClick={handleAddField}>+</button>
122 |       </div>
123 |     </BaseNode>
124 |   );
125 | };
126 | 
127 | export default ScriptNode;
120 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/StatusIndicatorComponent.tsx:
--------------------------------------------------------------------------------
 1 | import { IconCheck, IconX } from "@tabler/icons-react";
 2 | import React from "react";
 3 | 
/**
 * The states a StatusIndicator can display. Each member's value is the
 * lowercase string form of its name.
 */
export enum Status {
  WARNING = "warning",
  READY = "ready",
  ERROR = "error",
  LOADING = "loading",
  // Any value without its own case in StatusIndicator (including NONE)
  // renders an empty fragment.
  NONE = "none",
}
/** Props accepted by the StatusIndicator component. */
interface StatusIndicatorProps {
  // Which indicator to render.
  status: Status;
  // Optional tooltip text; when empty or omitted, a default message for the
  // given status is shown instead (the loading spinner has no tooltip).
  message?: string;
}
15 | 
/**
 * Renders the icon (and hover tooltip) for a given status.
 *
 * - WARNING: warning glyph
 * - READY: check icon
 * - ERROR: X icon
 * - LOADING: animated ring spinner (no tooltip)
 * - anything else: an empty fragment
 *
 * `message`, when non-empty, replaces the default tooltip text.
 */
export default function StatusIndicator({
  status,
  message,
}: StatusIndicatorProps): React.ReactElement {
  if (status === Status.WARNING) {
    // Default tooltip; the embedded newline and indentation are part of the
    // original text and are kept as-is.
    const fallback =
      "Something changed. Downstream results might be invalidated. Press \n            Play to rerun.";
    return (
      <div className="status-icon warning-status">
        &#9888;
        <span className="status-tooltip">{message || fallback}</span>
      </div>
    );
  }

  if (status === Status.READY) {
    const tooltip = message || "Responses collected and ready.";
    return (
      <div className="status-icon ready-status">
        <IconCheck size={20} stroke={3} style={{ marginBottom: "-4px" }} />
        <span className="status-tooltip">{tooltip}</span>
      </div>
    );
  }

  if (status === Status.ERROR) {
    const tooltip = message || "Error collecting responses.";
    return (
      <div className="status-icon error-status">
        <IconX size={20} stroke={3} style={{ marginBottom: "-4px" }} />
        <span className="status-tooltip">{tooltip}</span>
      </div>
    );
  }

  if (status === Status.LOADING) {
    // Four empty children make up the "lds-ring" spinner markup.
    return (
      <div className="lds-ring">
        <div></div>
        <div></div>
        <div></div>
        <div></div>
      </div>
    );
  }

  return <></>;
}
63 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/StrictModeDroppable.js:
--------------------------------------------------------------------------------
 1 | // StrictModeDroppable.tsx
 2 | // Credits to https://github.com/GiovanniACamacho and https://github.com/Meligy for the TypeScript version
 3 | // Original post: https://github.com/atlassian/react-beautiful-dnd/issues/2399#issuecomment-1175638194
 4 | import React, { useEffect, useState } from "react";
 5 | import { Droppable } from "react-beautiful-dnd";
 6 | export const StrictModeDroppable = ({ children, ...props }) => {
 7 |   const [enabled, setEnabled] = useState(false);
 8 |   useEffect(() => {
 9 |     const animation = window.requestAnimationFrame(() => setEnabled(true));
10 |     return () => {
11 |       window.cancelAnimationFrame(animation);
12 |       setEnabled(false);
13 |     };
14 |   }, []);
15 |   if (!enabled) {
16 |     return null;
17 |   }
18 |   return <Droppable {...props}>{children}</Droppable>;
19 | };
20 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/__test__/ai.test.ts:
--------------------------------------------------------------------------------
 1 | import { autofill, generateAndReplace } from "../ai";
 2 | 
 3 | const apiKeys = {
 4 |   OpenAI: process.env.OPENAI_API_KEY,
 5 |   AWS_Access_Key_ID: process.env.AWS_ACCESS_KEY_ID,
 6 |   AWS_Secret_Access_Key: process.env.AWS_SECRET_ACCESS_KEY,
 7 |   AWS_Session_Token: process.env.AWS_SESSION_TOKEN,
 8 | };
 9 | 
10 | describe("autofill-openai", () => {
11 |   if (!apiKeys.OpenAI) {
12 |     return;
13 |   }
14 |   it("should return an array of n rows", async () => {
15 |     const input = ["1", "2", "3", "4", "5"];
16 |     const n = 3;
17 |     const result = await autofill(input, n, "OpenAI", apiKeys);
18 |     expect(result).toHaveLength(n);
19 |     result.forEach((row) => {
20 |       expect(typeof row).toBe("string");
21 |     });
22 |   });
23 | });
24 | 
25 | describe("generateAndReplace-openai", () => {
26 |   if (!apiKeys.OpenAI) {
27 |     return;
28 |   }
29 |   it("should return an array of n rows", async () => {
30 |     const prompt = "animals";
31 |     const n = 3;
32 |     const result = await generateAndReplace(
33 |       prompt,
34 |       n,
35 |       false,
36 |       "OpenAI",
37 |       apiKeys,
38 |     );
39 |     expect(result).toHaveLength(n);
40 |     result.forEach((row) => {
41 |       expect(typeof row).toBe("string");
42 |     });
43 |   });
44 | });
45 | 
46 | describe("autofill-bedrock-anthropic", () => {
47 |   if (!apiKeys.AWS_Access_Key_ID) {
48 |     return;
49 |   }
50 |   it("should return an array of n rows", async () => {
51 |     const input = ["1", "2", "3", "4", "5"];
52 |     const n = 3;
53 |     const result = await autofill(input, n, "Bedrock", apiKeys);
54 |     expect(result).toHaveLength(n);
55 |     result.forEach((row) => {
56 |       expect(typeof row).toBe("string");
57 |     });
58 |   });
59 | });
60 | 
61 | describe("generateAndReplace-bedrock-anthropic", () => {
62 |   if (!apiKeys.AWS_Access_Key_ID) {
63 |     return;
64 |   }
65 |   it("should return an array of n rows", async () => {
66 |     const prompt = "animals";
67 |     const n = 3;
68 |     const result = await generateAndReplace(
69 |       prompt,
70 |       n,
71 |       false,
72 |       "Bedrock",
73 |       apiKeys,
74 |     );
75 |     expect(result).toHaveLength(n);
76 |     result.forEach((row) => {
77 |       expect(typeof row).toBe("string");
78 |     });
79 |   });
80 | });
81 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/__test__/aiSuggestionsManager.test.ts:
--------------------------------------------------------------------------------
 1 | import AISuggestionsManager from "../aiSuggestionsManager";
 2 | 
 3 | describe("AISuggestionsManager", () => {
 4 |   let suggestionsManager: AISuggestionsManager;
 5 |   let mockRows: string[];
 6 | 
 7 |   beforeEach(() => {
 8 |     suggestionsManager = new AISuggestionsManager(() => "OpenAI");
 9 |     mockRows = ["one", "two", "three"];
10 |   });
11 | 
12 |   describe("update", () => {
13 |     it("should clear suggestions if necessary", () => {
14 |       jest.useFakeTimers();
15 |       suggestionsManager.suggestions = [...mockRows];
16 |       suggestionsManager.update(["one", "", ""]);
17 |       jest.runAllTimers();
18 |       expect(suggestionsManager.suggestions).toEqual([]);
19 |     });
20 |   });
21 | 
22 |   describe("peekSuggestions", () => {
23 |     it("should return the current suggestions", () => {
24 |       suggestionsManager.suggestions = [...mockRows];
25 |       expect(suggestionsManager.peekSuggestions()).toEqual(mockRows);
26 |     });
27 |   });
28 | 
29 |   describe("popSuggestion", () => {
30 |     it("should return and remove the first suggestion by default", () => {
31 |       suggestionsManager.suggestions = [...mockRows];
32 |       const firstSuggestion = mockRows[0];
33 |       expect(suggestionsManager.popSuggestion()).toEqual(firstSuggestion);
34 |       expect(suggestionsManager.suggestions).toEqual(mockRows.slice(1));
35 |     });
36 | 
37 |     it("should return and remove the suggestion at the given index", () => {
38 |       suggestionsManager.suggestions = [...mockRows];
39 |       const secondSuggestion = mockRows[1];
40 |       expect(suggestionsManager.popSuggestion(1)).toEqual(secondSuggestion);
41 |       expect(suggestionsManager.suggestions).toEqual(
42 |         mockRows.slice(0, 1).concat(mockRows.slice(2)),
43 |       );
44 |     });
45 |   });
46 | 
47 |   describe("removeSuggestion", () => {
48 |     it("should remove the given suggestion", () => {
49 |       suggestionsManager.suggestions = [...mockRows];
50 |       const secondSuggestion = mockRows[1];
51 |       suggestionsManager.removeSuggestion(secondSuggestion);
52 |       expect(suggestionsManager.suggestions).toEqual(
53 |         mockRows.slice(0, 1).concat(mockRows.slice(2)),
54 |       );
55 |     });
56 |   });
57 | 
58 |   describe("areSuggestionsLoading", () => {
59 |     it("should return the current loading state", () => {
60 |       expect(suggestionsManager.areSuggestionsLoading()).toBe(false);
61 |       suggestionsManager.isLoading = true;
62 |       expect(suggestionsManager.areSuggestionsLoading()).toBe(true);
63 |     });
64 |   });
65 | 
66 |   describe("cycleSuggestions", () => {
67 |     it("should deterministically reorder the suggestions", () => {
68 |       suggestionsManager.suggestions = [...mockRows];
69 |       expect(suggestionsManager.peekSuggestions()).toEqual(mockRows);
70 |       suggestionsManager.cycleSuggestions();
71 |       // Except to be a recombination: not equal but set-equal
72 |       expect(suggestionsManager.peekSuggestions()).not.toEqual(mockRows);
73 |       expect(new Set(suggestionsManager.peekSuggestions())).toEqual(
74 |         new Set(mockRows),
75 |       );
76 |     });
77 |   });
78 | });
79 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/__test__/cache.test.ts:
--------------------------------------------------------------------------------
 1 | import { expect, test } from "@jest/globals";
 2 | import StorageCache from "../cache";
 3 | 
 4 | test("saving and loading cache data from localStorage", () => {
 5 |   // Store Unicode and numeric data into StorageCache
 6 |   StorageCache.store("hello", { a: "土", b: "ہوا", c: "火" });
 7 |   StorageCache.store("world", 42);
 8 | 
 9 |   // Verify stored data:
10 |   let d = StorageCache.get("hello");
11 |   expect(d).toHaveProperty("a");
12 |   expect(d?.a).toBe("土");
13 | 
14 |   // Save to localStorage
15 |   StorageCache.saveToLocalStorage("test");
16 | 
17 |   // Remove all data in the cache
18 |   StorageCache.clear();
19 | 
20 |   // Double-check there's no data:
21 |   d = StorageCache.get("hello");
22 |   expect(d).toBeUndefined();
23 | 
24 |   // Load cache from localStorage
25 |   StorageCache.loadFromLocalStorage("test", false);
26 | 
27 |   // Verify stored data:
28 |   d = StorageCache.get("hello");
29 |   expect(d).toHaveProperty("c");
30 |   expect(d?.c).toBe("火");
31 |   expect(StorageCache.get("world")).toBe(42);
32 | });
33 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/__test__/query.test.ts:
--------------------------------------------------------------------------------
  1 | /*
  2 |  * @jest-environment node
  3 |  */
  4 | import { PromptPipeline } from "../query";
  5 | import { LLM, LLMProvider, NativeLLM } from "../models";
  6 | import { expect, test } from "@jest/globals";
  7 | import { LLMResponseError, RawLLMResponseObject } from "../typing";
  8 | 
  9 | async function prompt_model(model: LLM, provider: LLMProvider): Promise<void> {
 10 |   const pipeline = new PromptPipeline(
 11 |     "What is the oldest {thing} in the world? Keep your answer brief.",
 12 |     model.toString(),
 13 |   );
 14 |   let responses: Array<RawLLMResponseObject | LLMResponseError> = [];
 15 |   for await (const response of pipeline.gen_responses(
 16 |     { thing: ["bar", "tree", "book"] },
 17 |     model,
 18 |     provider,
 19 |     1,
 20 |     1.0,
 21 |   )) {
 22 |     responses.push(response);
 23 |   }
 24 |   expect(responses).toHaveLength(3);
 25 | 
 26 |   // Double-check the cache'd results
 27 |   let cache = pipeline._load_cached_responses();
 28 |   Object.entries(cache).forEach(([prompt, response]) => {
 29 |     const r = Array.isArray(response) ? response[0] : response;
 30 |     console.log(`Prompt: ${prompt}\nResponse: ${r.responses[0]}`);
 31 |   });
 32 |   expect(Object.keys(cache)).toHaveLength(3); // expect 3 prompts
 33 | 
 34 |   // Now query ChatGPT again, but set n=2 to force it to send off 1 query per prompt.
 35 |   responses = [];
 36 |   for await (const response of pipeline.gen_responses(
 37 |     { thing: ["bar", "tree", "book"] },
 38 |     model,
 39 |     provider,
 40 |     2,
 41 |     1.0,
 42 |   )) {
 43 |     responses.push(response);
 44 |   }
 45 |   expect(responses).toHaveLength(3); // still 3
 46 |   responses.forEach((resp_obj) => {
 47 |     if (resp_obj instanceof LLMResponseError) return;
 48 |     expect(resp_obj.responses).toHaveLength(2); // each response object should have 2 candidates, as n=2
 49 |   });
 50 | 
 51 |   // Double-check the cache'd results
 52 |   cache = pipeline._load_cached_responses();
 53 |   Object.entries(cache).forEach(([prompt, response]) => {
 54 |     const resp_obj = Array.isArray(response) ? response[0] : response;
 55 |     console.log(
 56 |       `Prompt: ${prompt}\nResponses: ${JSON.stringify(resp_obj.responses)}`,
 57 |     );
 58 |     expect(resp_obj.responses).toHaveLength(2);
 59 |   });
 60 |   expect(Object.keys(cache)).toHaveLength(3); // still expect 3 prompts
 61 | 
 62 |   // Now send off the exact same query. It should use only the cache'd results:
 63 |   responses = [];
 64 |   for await (const response of pipeline.gen_responses(
 65 |     { thing: ["bar", "tree", "book"] },
 66 |     model,
 67 |     provider,
 68 |     2,
 69 |     1.0,
 70 |   )) {
 71 |     responses.push(response);
 72 |   }
 73 |   expect(responses).toHaveLength(3); // still 3
 74 |   responses.forEach((resp_obj) => {
 75 |     if (resp_obj instanceof LLMResponseError) return;
 76 |     expect(resp_obj.responses).toHaveLength(2); // each response object should have 2 candidates, as n=2
 77 |   });
 78 | 
 79 |   cache = pipeline._load_cached_responses();
 80 |   // eslint-disable-next-line
 81 |   Object.entries(cache).forEach(([prompt, response]) => {
 82 |     const resp_obj = Array.isArray(response) ? response[0] : response;
 83 |     expect(resp_obj.responses).toHaveLength(2);
 84 |   });
 85 |   expect(Object.keys(cache)).toHaveLength(3); // still expect 3 prompts
 86 | }
 87 | 
// Each test below runs the shared prompt_model scenario against one provider.
// The trailing number is the Jest timeout for that test, in milliseconds.
test("basic prompt pipeline with chatgpt", async () => {
  // Setup a simple pipeline with a prompt template, 1 variable and 3 input values
  await prompt_model(NativeLLM.OpenAI_ChatGPT, LLMProvider.OpenAI);
}, 20000);

test("basic prompt pipeline with anthropic", async () => {
  await prompt_model(NativeLLM.Claude_v1, LLMProvider.Anthropic);
}, 40000);

test("basic prompt pipeline with google palm2", async () => {
  await prompt_model(NativeLLM.PaLM2_Chat_Bison, LLMProvider.Google);
}, 40000);
100 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/__test__/setUtils.test.ts:
--------------------------------------------------------------------------------
  1 | import {
  2 |   union,
  3 |   isSubset,
  4 |   isExtension,
  5 |   isExtensionIgnoreEmpty,
  6 |   isEqual,
  7 | } from "../setUtils";
  8 | 
// Unit tests for the helpers exported by ../setUtils. The first four groups
// pass Set objects; the isExtensionIgnoreEmpty group passes string arrays.
describe("setUtils", () => {
  // isEqual: same members => true; one differing member => false.
  describe("isEqual", () => {
    it("returns true if two sets are equal", () => {
      const setA = new Set([1, 2, 3]);
      const setB = new Set([1, 2, 3]);
      expect(isEqual(setA, setB)).toBe(true);
    });

    it("returns false if two sets are not equal", () => {
      const setA = new Set([1, 2, 3]);
      const setB = new Set([1, 2, 4]);
      expect(isEqual(setA, setB)).toBe(false);
    });
  });

  // union: overlapping members appear once in the result.
  describe("union", () => {
    it("returns the union of two sets", () => {
      const setA = new Set([1, 2, 3]);
      const setB = new Set([2, 3, 4]);
      const expected = new Set([1, 2, 3, 4]);
      expect(union(setA, setB)).toEqual(expected);
    });
  });

  // isSubset(A, B): argument order matters, as the second case shows.
  describe("isSubset", () => {
    it("returns true if A is a subset of B", () => {
      const setA = new Set([1, 2]);
      const setB = new Set([1, 2, 3]);
      expect(isSubset(setA, setB)).toBe(true);
    });

    it("returns false if A is not a subset of B", () => {
      const setA = new Set([1, 2, 3]);
      const setB = new Set([1, 2]);
      expect(isSubset(setA, setB)).toBe(false);
    });
  });

  // isExtension(A, B, C): in the passing case A holds all of B plus one
  // member of C; in the failing case A is missing a member of B.
  describe("isExtension", () => {
    it("returns true if A is an extension of B and C", () => {
      const setA = new Set([1, 2, 3]);
      const setB = new Set([1, 2]);
      const setC = new Set([3, 4]);
      expect(isExtension(setA, setB, setC)).toBe(true);
    });

    it("returns false if A is not an extension of B and C", () => {
      const setA = new Set([1, 3, 4]);
      const setB = new Set([1, 2]);
      const setC = new Set([3, 4]);
      expect(isExtension(setA, setB, setC)).toBe(false);
    });
  });

  // isExtensionIgnoreEmpty: same cases as above, but over string arrays that
  // contain "" entries, which the function is expected to disregard.
  describe("isExtensionIgnoreEmpty", () => {
    it("returns true if A is an extension of B and C, ignoring empty strings", () => {
      const setA = ["", "1", "2", "", "3"];
      const setB = ["", "1", "2", ""];
      const setC = ["3", "4", ""];
      expect(isExtensionIgnoreEmpty(setA, setB, setC)).toBe(true);
    });

    it("returns false if A is not an extension of B and C, ignoring empty strings", () => {
      const setA = ["", "1", "3", "", "4"];
      const setB = ["", "1", "2", ""];
      const setC = ["3", "4", ""];
      expect(isExtensionIgnoreEmpty(setA, setB, setC)).toBe(false);
    });

    // A is B's non-empty rows plus "Arctic White", the first entry of C.
    it("return true on this real-life color example", () => {
      const setA = [
        "Red",
        "Sky Blue",
        "Deep Purple",
        "Sunshine Yellow",
        "Midnight Black",
        "Emerald Green",
        "Electric Pink",
        "Arctic White",
        "",
        "",
      ];
      const setB = [
        "Red",
        "Sky Blue",
        "Deep Purple",
        "Sunshine Yellow",
        "Midnight Black",
        "Emerald Green",
        "Electric Pink",
        "",
        "",
        "",
      ];
      const setC = [
        "Arctic White",
        "Ocean Blue",
        "Fiery Orange",
        "Lavender Purple",
        "Goldenrod Yellow",
      ];
      expect(isExtensionIgnoreEmpty(setA, setB, setC)).toBe(true);
    });
  });
});
114 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/canceler.ts:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * A CancelTracker allows ids to be added, to signal
 3 |  * any associated processes should be 'canceled'. The tracker
 4 |  * operates as a global. It does not cancel anything itself,
 5 |  * but rather can be used to send a message to cancel a process
 6 |  * associated with 'id' (through .add(id)), which the process itself
 7 |  * checks (through .has(id)) and then performs the cancellation.
 8 |  */
 9 | export default class CancelTracker {
10 |   // eslint-disable-next-line no-use-before-define
11 |   private static instance: CancelTracker;
12 |   private data: Set<string | number>;
13 | 
14 |   private constructor() {
15 |     this.data = new Set();
16 |   }
17 | 
18 |   // Get the canceler
19 |   public static getInstance(): CancelTracker {
20 |     if (!CancelTracker.instance) CancelTracker.instance = new CancelTracker();
21 |     return CancelTracker.instance;
22 |   }
23 | 
24 |   // Add an id to trigger cancelation
25 |   private addId(id: string | number): void {
26 |     this.data.add(id);
27 |   }
28 | 
29 |   public static add(id: string | number): void {
30 |     CancelTracker.getInstance().addId(id);
31 |   }
32 | 
33 |   // Canceler has the given id
34 |   private hasId(id: string | number): boolean {
35 |     return this.data.has(id);
36 |   }
37 | 
38 |   public static has(id: string | number): boolean {
39 |     return CancelTracker.getInstance().hasId(id);
40 |   }
41 | 
42 |   // Clear id from the canceler
43 |   private clearId(id: string | number): void {
44 |     if (CancelTracker.has(id)) this.data.delete(id);
45 |   }
46 | 
47 |   public static clear(id: string | number): void {
48 |     CancelTracker.getInstance().clearId(id);
49 |   }
50 | 
51 |   private clearTracker(): void {
52 |     this.data.clear();
53 |   }
54 | 
55 |   public static clearAll(): void {
56 |     CancelTracker.getInstance().clearTracker();
57 |   }
58 | }
59 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/errors.ts:
--------------------------------------------------------------------------------
 1 | export class DuplicateVariableNameError extends Error {
 2 |   constructor(variable: string) {
 3 |     super();
 4 |     this.name = "DuplicateVariableNameError";
 5 |     this.message =
 6 |       "You have multiple template variables with the same name, {" +
 7 |       variable +
 8 |       "}. Duplicate names in the same chain is not allowed. To fix, ensure that all template variable names are unique across a chain.";
 9 |   }
10 | }
11 | 
/**
 * Error stating that the user forced a process to exit early. When `id` is
 * given, it is appended to the message.
 */
export class UserForcedPrematureExit extends Error {
  constructor(id?: string) {
    super();
    // Only an omitted/undefined id drops the suffix; "" still produces one.
    const suffix = id === undefined ? "" : ` with id ${id}`;
    this.name = "UserForcedPrematureExit";
    this.message = "You have forced the premature exit of the process" + suffix;
  }
}
21 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/evalgen/README.md:
--------------------------------------------------------------------------------
 1 | # `evalgen`: Grading and Evaluation Function Selection Module
 2 | 
This module takes a developer's prompt and a set of examples (variables, prompts, responses), suggests evaluation criteria (with confirmation from the developer, who may add other criteria), generates and evaluates multiple functions per criterion on each of the examples, and returns the best function per criterion (the one most aligned with the developer's grades).
 4 | 
 5 | ## Execution
 6 | 
There is an interactive script for trying out the functionality in `test.ts`. You can run it with `ts-node test.ts` from this module's directory (`evalgen`). The terminal is a bit laggy sometimes.
 8 | 
 9 | ## Architecture
10 | 
11 | The module is divided into the following components: `executor`, `utils`, `oai_utils`.
12 | 
13 | ### Utils
14 | 
15 | This module contains types and prompts for criteria generation, function generation, and function execution.
16 | 
17 | ### OAI Utils
18 | 
19 | This module contains utilities for interacting with the OpenAI API.
20 | 
21 | ### Executor
22 | 
This module contains the main logic. It takes a developer's prompt and a set of examples, as well as a list of evaluation criteria (which can be generated by the utils module). It has a background process that generates and evaluates functions for each criterion, updating each example's grading priority as function results stream in. There is a method to query the next example to grade, and another method to set the grade for an example. The module also has a method to query the best function per criterion (the one most aligned with the developer's grades).
24 | 
25 | # Credits
26 | 
27 | The `evalgen` module was created by Shreya Shankar. It was adapted to the ChainForge codebase by Ian Arawjo.
28 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/evalgen/oai_utils.ts:
--------------------------------------------------------------------------------
 1 | // import { env as process_env } from "process";
 2 | import { EventEmitter } from "events";
 3 | // import { AzureKeyCredential, OpenAIClient } from "@azure/openai";
 4 | import { hashtagTemplateVars, llmResponseDataToString } from "../utils";
 5 | import { simpleQueryLLM } from "../backend";
 6 | import { Dict, LLMSpec } from "../typing";
 7 | import { extractMdBlocks } from "./utils";
 8 | type ContentType = "python_fn" | "llm_eval";
 9 | 
10 | export class EvalGenAssertionEmitter extends EventEmitter {
11 |   private apiKeys: Dict | undefined;
12 | 
13 |   constructor(apiKeys?: Dict) {
14 |     super();
15 |     this.apiKeys = apiKeys;
16 |   }
17 | 
18 |   async generate(
19 |     prompt: string,
20 |     llm: string | LLMSpec,
21 |     contentType: ContentType,
22 |   ): Promise<void> {
23 |     const emit_prompt = (p: string) => this.emit("function", p);
24 | 
25 |     const result = await simpleQueryLLM(
26 |       prompt, // prompt
27 |       typeof llm === "string" ? llm : [llm], // llm
28 |       // spec, // llm
29 |       "You are an expert Python programmer and helping me write assertions for my LLM pipeline. An LLM pipeline accepts an example and prompt template, fills the template's placeholders with the example, and generates a response.", // system_msg
30 |       this.apiKeys, // API keys (if any)
31 |     );
32 | 
33 |     if (result.errors && Object.keys(result.errors).length > 0)
34 |       throw new Error(Object.values(result.errors as Dict)[0].toString());
35 | 
36 |     // Get output (text from LLM response)
37 |     const output = llmResponseDataToString(result.responses[0].responses[0]);
38 |     console.log("Streamer: LLM said: ", output); // for debuggging
39 | 
40 |     // Attempt to extract output depending on content type
41 |     if (contentType === "llm_eval") {
42 |       // Expected output is a ``json block that is just a list of three strings representing the prompts i.e. ["str1", "str2", "str3"]
43 |       // Attempt to extract JSON blocks (strings) from output
44 |       const json_blocks = extractMdBlocks(output, "json");
45 |       if (json_blocks === undefined || json_blocks.length === 0)
46 |         throw new Error(
47 |           "EvalGen: Could not parse LLM response into evaluation prompt: No JSON detected in output.",
48 |         );
49 | 
50 |       // If we passed, this should be a list of strings:
51 |       const prompts = json_blocks.flatMap((b) => JSON.parse(b));
52 |       // Verify format:
53 |       if (prompts.every((p) => typeof p === "string")) {
54 |         // If these are all strings, we are good to go--
55 |         // We must be careful to first hashtag all template variables in the prompt
56 |         // before emitting them, so that they are not interpreted as template variables.
57 |         const hashtagged_prompts = prompts.map((p) => hashtagTemplateVars(p));
58 |         // Emit all the LLM eval prompt candidates in one burst
59 |         hashtagged_prompts.forEach(emit_prompt);
60 |       } else {
61 |         console.error(
62 |           "Unexpected output type after JSON parsing: At least generated LLM eval prompt is not a string.",
63 |           prompts,
64 |         );
65 |         throw new Error("Unexpected output type after JSON parsing");
66 |       }
67 |     } else if (contentType === "python_fn") {
68 |       // Expected output has ~3 Python codeblocks within ```python markers
69 |       // Attempt to extract code blocks from output
70 |       const code_blocks = extractMdBlocks(output, "python");
71 |       if (code_blocks === undefined || code_blocks.length === 0)
72 |         throw new Error(
73 |           "EvalGen: Could not parse LLM response into Python function: No code detected in output.",
74 |         );
75 | 
76 |       // If we passed, this should be a list of Python code functions. We assume it is OK, and treat them separately:
77 |       code_blocks.forEach(emit_prompt);
78 |     } else {
79 |       throw new Error("Unknown content type: " + contentType);
80 |     }
81 | 
82 |     this.emit("end"); // Signal that streaming is complete
83 |   }
84 | }
85 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/evalgen/test.ts:
--------------------------------------------------------------------------------
  1 | // import fs from "fs";
  2 | // import csvParser from "csv-parser";
  3 | // import readline from "readline";
  4 | 
  5 | // import { Example, EvalCriteria, generateLLMEvaluationCriteria } from "./utils";
  6 | // import EvaluationFunctionExecutor from "./executor";
  7 | 
  8 | // const readCSV = async (filePath: string): Promise<Example[]> => {
  9 | //   const examples: Example[] = [];
 10 | //   let counter = 0; // Counter to generate unique IDs
 11 | 
 12 | //   return new Promise((resolve, reject) => {
 13 | //     fs.createReadStream(filePath)
 14 | //       .pipe(csvParser(["prompt", "example", "response", "model"]))
 15 | //       .on("data", (data) => {
 16 | //         try {
 17 | //           examples.push({
 18 | //             id: `example_${++counter}`, // Generating a unique ID
 19 | //             variables: data.example,
 20 | //             prompt: data.prompt,
 21 | //             response: data.response,
 22 | //           });
 23 | //         } catch (error) {
 24 | //           // console.error("Error parsing variables from CSV:", error);
 25 | //           // Don't throw here, just skip the example
 26 | //         }
 27 | //       })
 28 | //       .on("end", () => resolve(examples))
 29 | //       .on("error", reject);
 30 | //   });
 31 | // };
 32 | 
 33 | // const rl = readline.createInterface({
 34 | //   input: process.stdin,
 35 | //   output: process.stdout,
 36 | // });
 37 | 
 38 | // const askQuestion = (query: string): Promise<string> =>
 39 | //   new Promise((resolve) => rl.question(query, resolve));
 40 | 
 41 | // const main = async () => {
 42 | //   // Placeholder values - replace with actual data
 43 | //   const promptTemplate = `You are an AI Assistant that’s an expert at reviewing pull requests. Review the below pull request that you receive.
 44 | 
 45 | //   Input format
 46 | //   - The input format follows Github diff format with addition and subtraction of code.
 47 | //   - The + sign means that code has been added.
 48 | //   - The - sign means that code has been removed.
 49 | 
 50 | //   Instructions
 51 | //   - Take into account that you don’t have access to the full code but only the code diff.
 52 | //   - Only answer on what can be improved and provide the improvement in code.
 53 | //   - Answer in short form.
 54 | //   - Include code snippets if necessary.
 55 | //   - Adhere to the languages code conventions.
 56 | //   - Make it personal and always show gratitude to the author using "@" when tagging.`;
 57 | 
 58 | //   let examples: Example[] = await readCSV("./codereviews.csv");
 59 | 
 60 | //   // Get a sample of 10 examples
 61 | //   examples = examples.slice(0, 10);
 62 | 
 63 | //   // Print number of examples
 64 | //   console.log(`Loaded ${examples.length} examples.`);
 65 | 
 66 | //   // Start a timer
 67 | //   let start = Date.now();
 68 | //   let timeElapsed = 0;
 69 | 
 70 | //   // Step 1: Suggest eval criteria and solicit approval
 71 | //   const evalCriteria = await generateLLMEvaluationCriteria(promptTemplate);
 72 | //   // Pause the timer
 73 | //   timeElapsed += Date.now() - start;
 74 | 
 75 | //   const approval = await askQuestion(
 76 | //     "Do you approve the suggested criteria? (y/n) ",
 77 | //   );
 78 | 
 79 | //   if (approval.toLowerCase() !== "y") {
 80 | //     console.log(
 81 | //       "Please adjust the criteria directly in the source code for now.",
 82 | //     );
 83 | //     return;
 84 | //   }
 85 | 
 86 | //   const executor = new EvaluationFunctionExecutor(
 87 | //     promptTemplate,
 88 | //     examples,
 89 | //   );
 90 | 
 91 | //   // Set the evaluation criteria
 92 | //   executor.setEvaluationCriteria(evalCriteria);
 93 | 
 94 | //   // Resume the timer
 95 | //   start = Date.now();
 96 | 
 97 | //   // Step 2: Start background task
 98 | //   executor.start();
 99 | 
100 | //   //   await executor.waitForCompletion();
101 | 
102 | //   //   Step 3: Present examples to grade
103 | //   while (true) {
104 | //     // Get ungraded scores
105 | //     const ungradedScores = executor.getUngradedScores();
106 | //     console.log("Ungraded Scores: ", ungradedScores);
107 | 
108 | //     const nextExampleId = executor.getNextExampleToGrade();
109 | //     if (!nextExampleId) {
110 | //       console.log("All examples graded or no examples available.");
111 | //       break;
112 | //     }
113 | 
114 | //     const example = examples.find((e) => e.id === nextExampleId);
115 | //     if (!example) continue;
116 | 
117 | //     console.log(
118 | //       `Example ID: ${example.id}, Prompt: ${example.prompt}, Response: ${example.response}`,
119 | //     );
120 | //     const grade = await askQuestion(
121 | //       "Is this response acceptable? (y/n/finish) ",
122 | //     );
123 | 
124 | //     if (grade === "finish") {
125 | //       break;
126 | //     }
127 | 
128 | //     executor.setGradeForExample(example.id, grade.toLowerCase() === "y");
129 | //   }
130 | 
131 | //   // Print grades
132 | //   console.log("Grades: ", executor.getGrades());
133 | 
134 | //   // Step 4: Filtering and results
135 | //   //   await executor.waitForCompletion();
136 | //   const filteredFunctions = await executor.filterEvaluationFunctions(0.2);
137 | //   console.log("Filtered Functions: ", filteredFunctions);
138 | 
139 | //   rl.close();
140 | // };
141 | 
142 | // main().catch(console.error);
143 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/evalgen/typing.ts:
--------------------------------------------------------------------------------
 1 | import { ChatHistoryInfo, Dict } from "../typing";
 2 | 
 3 | export type EvalCriteriaUID = string;
 4 | 
 5 | export interface EvalCriteria {
 6 |   shortname: string;
 7 |   criteria: string;
 8 |   eval_method: "code" | "expert";
 9 |   uid: EvalCriteriaUID;
10 |   priority: number;
11 |   source?: string;
12 | }
13 | 
14 | export interface EvalGenReport {
15 |   criteria: EvalCriteria[];
16 |   failureCoverage: number;
17 |   falseFailureRate: number;
18 | }
19 | 
20 | export function validEvalCriteriaFormat(json_obj: Dict) {
21 |   return (
22 |     "criteria" in json_obj &&
23 |     "shortname" in json_obj &&
24 |     ["code", "expert"].includes(json_obj.eval_method)
25 |   );
26 | }
27 | 
28 | export enum EvalFunctionResult {
29 |   PASS = "pass",
30 |   FAIL = "fail",
31 |   SKIP = "skip",
32 | }
33 | 
34 | export interface EvalFunction {
35 |   evalCriteria: EvalCriteria;
36 |   code: string;
37 |   name: string;
38 |   uid: string;
39 | }
40 | 
41 | export interface EvalFunctionReport {
42 |   evalFunction: EvalFunction;
43 |   true_pass: number;
44 |   true_fail: number;
45 |   false_pass: number;
46 |   false_fail: number;
47 |   skipped: number;
48 |   mcc?: number; // Matthews correlation coefficient, which is a measure of the quality of binary classifications
49 |   f1?: number; // F1 score, which is the harmonic mean of precision and recall
50 |   cohens_kappa?: number; // Cohen's kappa, which is a measure of inter-rater agreement
51 |   failureCoverage?: number; // The percentage of failures that were covered by the eval function
52 |   falseFailureRate?: number; // The percentage of false failures
53 | }
54 | 
55 | export interface EvalFunctionSetReport {
56 |   failureCoverage: number;
57 |   falseFailureRate: number;
58 |   selectedEvalFunctions: EvalFunction[];
59 |   allEvalFunctionReports: Map<EvalCriteria, EvalFunctionReport[]>; // Map from criteria to function reports
60 | }
61 | 
62 | export class EvalExecutionError extends Error {
63 |   constructor(message: string) {
64 |     super(message); // Call the parent constructor with the message
65 |     this.name = "EvalExecutionError"; // Set the error name to the class name
66 |     Object.setPrototypeOf(this, EvalExecutionError.prototype);
67 |   }
68 | }
69 | 
70 | export const AssertionWriterSystemMsg =
71 |   "You are an expert Python programmer and helping me write assertions for my LLM pipeline. An LLM pipeline accepts an example and prompt template, fills the template's placeholders with the example, and generates a response.";
72 | export const AssertionWriterSystemMsgChatHistory: ChatHistoryInfo[] = [
73 |   {
74 |     messages: [
75 |       {
76 |         role: "system",
77 |         content: AssertionWriterSystemMsg,
78 |       },
79 |     ],
80 |     fill_history: {},
81 |   },
82 | ];
83 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/pyodide/exec-py.js:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * Executes Python code in browser sandbox with pyodide.
 3 |  *
 4 |  * Code adapted from https://pyodide.org/en/stable/usage/webworker.html
 5 |  */
 6 | 
 7 | import { v4 as uuid } from "uuid";
 8 | 
 9 | // Setup
10 | let pyodideWorker = undefined;
11 | const callbacks = {};
12 | 
13 | const execPy = (() => {
14 |   return (script, context) => {
15 |     // Initalize the worker only when first called, to save on load times
16 |     if (!pyodideWorker) {
17 |       pyodideWorker = new Worker(
18 |         new URL("./exec-py.worker.js", import.meta.url),
19 |       );
20 |       pyodideWorker.onmessage = (event) => {
21 |         const { id, ...data } = event.data;
22 |         const onSuccess = callbacks[id];
23 |         delete callbacks[id];
24 |         onSuccess(data);
25 |       };
26 |     }
27 | 
28 |     let id = uuid();
29 | 
30 |     // Execute the worker
31 |     return new Promise((onSuccess) => {
32 |       callbacks[id] = onSuccess;
33 |       pyodideWorker.postMessage({
34 |         ...context,
35 |         python: script,
36 |         id,
37 |       });
38 |     });
39 |   };
40 | })();
41 | 
42 | export { execPy };
43 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/pyodide/exec-py.worker.js:
--------------------------------------------------------------------------------
 1 | // WebWorker code adapted from https://pyodide.org/en/stable/usage/webworker.html
 2 | 
 3 | // Import Pyodide script:
 4 | importScripts("https://cdn.jsdelivr.net/pyodide/v0.25.0/full/pyodide.js");
 5 | 
 6 | async function loadPyodideAndPackages() {
 7 |   self.pyodide = await loadPyodide();
 8 | 
 9 |   // Here, we can load any packages we wish. For now, this feature is disabled:
10 |   // await self.pyodide.loadPackage(["numpy", "pytz"]);
11 | }
12 | let pyodideReadyPromise = loadPyodideAndPackages();
13 | 
14 | self.onmessage = async function (event) {
15 |   // make sure loading is done
16 |   await pyodideReadyPromise;
17 |   // Don't bother yet with this line, suppose our API is built in such a way:
18 |   const { id, python, ...context } = event.data;
19 |   // The worker copies the context in its own "memory" (an object mapping name to values)
20 |   for (const key of Object.keys(context)) {
21 |     self[key] = context[key];
22 |   }
23 |   // Now is the easy part, the one that is similar to working in the main thread:
24 |   try {
25 |     await self.pyodide.loadPackagesFromImports(python);
26 |     let results = await self.pyodide.runPythonAsync(python);
27 |     self.postMessage({ results, id });
28 |   } catch (error) {
29 |     self.postMessage({ error: error.message, id });
30 |   }
31 | };
32 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/setUtils.ts:
--------------------------------------------------------------------------------
 1 | // Returns whether two sets are equal.
 2 | export function isEqual<T>(a: Set<T>, b: Set<T>): boolean {
 3 |   return isSubset(a, b) && isSubset(b, a);
 4 | }
 5 | 
 6 | // Returns the union of two sets.
 7 | export function union<T>(a: Set<T>, b: Set<T>): Set<T> {
 8 |   return new Set([...a, ...b]);
 9 | }
10 | 
11 | // Returns whether A is a subset of B.
12 | export function isSubset<T>(a: Set<T>, b: Set<T>): boolean {
13 |   return [...a].every((x) => b.has(x));
14 | }
15 | 
16 | export function isSuperset<T>(a: Set<T>, b: Set<T>): boolean {
17 |   return isSubset(b, a);
18 | }
19 | 
20 | export function subtract<T>(a: Set<T>, b: Set<T>): Set<T> {
21 |   return new Set([...a].filter((x) => !b.has(x)));
22 | }
23 | 
24 | // A is an "extension" of B and C if
25 | // (1) A is a superset of B
26 | // (2) The elements in A that are not in B are a subset of C.
27 | export function isExtension<T>(a: Set<T>, b: Set<T>, c: Set<T>): boolean {
28 |   return isSuperset(a, b) && isSubset(subtract(a, b), c);
29 | }
30 | 
31 | // Returns whether A is an "extension" of B and C, ignoring empty strings.
32 | export function isExtensionIgnoreEmpty(a: string[], b: string[], c: string[]) {
33 |   const emptyStringFilter = (x: string) => x !== "";
34 |   return isExtension(
35 |     new Set(a.filter(emptyStringFilter)),
36 |     new Set(b.filter(emptyStringFilter)),
37 |     new Set(c.filter(emptyStringFilter)),
38 |   );
39 | }
40 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/backend/tableUtils.ts:
--------------------------------------------------------------------------------
 1 | import { v4 as uuidv4 } from "uuid";
 2 | import { Dict, TabularDataRowType, TabularDataColType } from "./typing";
 3 | /*
 4 |   This file contains utility functions for parsing raw table data
 5 |   into a format for TabularDataNode
 6 | */
 7 | /**
 8 |  * Converts an array of row objects into the columns/rows shape used by TabularDataNode.
 9 |  *
10 |  * Every distinct property name found across the rows becomes a column with a
11 |  * generated key (`c0`, `c1`, ...). Each row gets a fresh `__uid` and stores its
12 |  * cell values as strings under those generated keys.
13 |  *
14 |  * @param rawTableData Array of row objects keyed by column header.
15 |  * @returns The derived column definitions and the converted rows.
16 |  * @throws Error if `rawTableData` is not an array.
17 |  */
18 | export function parseTableData(rawTableData: any[]): {
19 |   columns: TabularDataColType[];
20 |   rows: TabularDataRowType[];
21 | } {
22 |   if (!Array.isArray(rawTableData)) {
23 |     throw new Error(
24 |       "Table data is not in array format: " +
25 |         (rawTableData !== undefined && rawTableData !== null
26 |           ? String(rawTableData)
27 |           : ""),
28 |     );
29 |   }
30 | 
31 |   // Extract unique column names
32 |   const headers = new Set<string>();
33 |   rawTableData.forEach((row) =>
34 |     Object.keys(row).forEach((key) => headers.add(key)),
35 |   );
36 | 
37 |   // Create columns with unique IDs
38 |   const columns = Array.from(headers).map((header, idx) => ({
39 |     header,
40 |     key: `c${idx}`,
41 |   }));
42 | 
43 |   // Create a lookup table for column keys
44 |   const columnKeyLookup: Dict<string> = {};
45 |   columns.forEach((col) => {
46 |     columnKeyLookup[col.header] = col.key;
47 |   });
48 | 
49 |   // Map rows to the new column keys
50 |   const rows = rawTableData.map((row) => {
51 |     const parsedRow: TabularDataRowType = { __uid: uuidv4() };
52 |     Object.keys(row).forEach((header) => {
53 |       const rawValue = row[header];
54 |       // `typeof null` is "object", so handle null/undefined first; otherwise a
55 |       // null cell would be stored as the literal string "null".
56 |       if (rawValue === null || rawValue === undefined) {
57 |         parsedRow[columnKeyLookup[header]] = "";
58 |         return;
59 |       }
60 |       const value =
61 |         typeof rawValue === "object" ? JSON.stringify(rawValue) : rawValue;
62 |       parsedRow[columnKeyLookup[header]] = value?.toString() ?? "";
63 |     });
64 |     return parsedRow;
65 |   });
66 | 
67 |   return { columns, rows };
68 | }
69 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/index.css:
--------------------------------------------------------------------------------
 1 | body {
 2 |   margin: 0;
 3 |   font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", "Roboto", "Oxygen",
 4 |     "Ubuntu", "Cantarell", "Fira Sans", "Droid Sans", "Helvetica Neue",
 5 |     sans-serif;
 6 |   -webkit-font-smoothing: antialiased;
 7 |   -moz-osx-font-smoothing: grayscale;
 8 | }
 9 | 
10 | code {
11 |   font-family: Menlo, Monaco, Consolas, "Courier New", monospace;
12 | }
13 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/index.js:
--------------------------------------------------------------------------------
 1 | import React from "react";
 2 | import ReactDOM from "react-dom/client";
 3 | import "./index.css";
 4 | import App from "./App";
 5 | import reportWebVitals from "./reportWebVitals";
 6 | import { ContextMenuProvider } from "mantine-contextmenu";
 7 | import { AlertModalProvider } from "./AlertModal";
 8 | import ColorThemeProvider from "./ColorThemeProvider";
 9 | 
10 | const root = ReactDOM.createRoot(document.getElementById("root"));
11 | root.render(
12 |   <React.StrictMode>
13 |     <ColorThemeProvider>
14 |       <AlertModalProvider>
15 |         <ContextMenuProvider>
16 |           <App />
17 |         </ContextMenuProvider>
18 |       </AlertModalProvider>
19 |     </ColorThemeProvider>
20 |   </React.StrictMode>,
21 | );
22 | 
23 | // If you want to start measuring performance in your app, pass a function
24 | // to log results (for example: reportWebVitals(console.log))
25 | // or send to an analytics endpoint. Learn more: https://bit.ly/CRA-vitals
26 | reportWebVitals();
27 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/logo.svg:
--------------------------------------------------------------------------------
1 | <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 841.9 595.3"><g fill="#61DAFB"><path d="M666.3 296.5c0-32.5-40.7-63.3-103.1-82.4 14.4-63.6 8-114.2-20.2-130.4-6.5-3.8-14.1-5.6-22.4-5.6v22.3c4.6 0 8.3.9 11.4 2.6 13.6 7.8 19.5 37.5 14.9 75.7-1.1 9.4-2.9 19.3-5.1 29.4-19.6-4.8-41-8.5-63.5-10.9-13.5-18.5-27.5-35.3-41.6-50 32.6-30.3 63.2-46.9 84-46.9V78c-27.5 0-63.5 19.6-99.9 53.6-36.4-33.8-72.4-53.2-99.9-53.2v22.3c20.7 0 51.4 16.5 84 46.6-14 14.7-28 31.4-41.3 49.9-22.6 2.4-44 6.1-63.6 11-2.3-10-4-19.7-5.2-29-4.7-38.2 1.1-67.9 14.6-75.8 3-1.8 6.9-2.6 11.5-2.6V78.5c-8.4 0-16 1.8-22.6 5.6-28.1 16.2-34.4 66.7-19.9 130.1-62.2 19.2-102.7 49.9-102.7 82.3 0 32.5 40.7 63.3 103.1 82.4-14.4 63.6-8 114.2 20.2 130.4 6.5 3.8 14.1 5.6 22.5 5.6 27.5 0 63.5-19.6 99.9-53.6 36.4 33.8 72.4 53.2 99.9 53.2 8.4 0 16-1.8 22.6-5.6 28.1-16.2 34.4-66.7 19.9-130.1 62-19.1 102.5-49.9 102.5-82.3zm-130.2-66.7c-3.7 12.9-8.3 26.2-13.5 39.5-4.1-8-8.4-16-13.1-24-4.6-8-9.5-15.8-14.4-23.4 14.2 2.1 27.9 4.7 41 7.9zm-45.8 106.5c-7.8 13.5-15.8 26.3-24.1 38.2-14.9 1.3-30 2-45.2 2-15.1 0-30.2-.7-45-1.9-8.3-11.9-16.4-24.6-24.2-38-7.6-13.1-14.5-26.4-20.8-39.8 6.2-13.4 13.2-26.8 20.7-39.9 7.8-13.5 15.8-26.3 24.1-38.2 14.9-1.3 30-2 45.2-2 15.1 0 30.2.7 45 1.9 8.3 11.9 16.4 24.6 24.2 38 7.6 13.1 14.5 26.4 20.8 39.8-6.3 13.4-13.2 26.8-20.7 39.9zm32.3-13c5.4 13.4 10 26.8 13.8 39.8-13.1 3.2-26.9 5.9-41.2 8 4.9-7.7 9.8-15.6 14.4-23.7 4.6-8 8.9-16.1 13-24.1zM421.2 430c-9.3-9.6-18.6-20.3-27.8-32 9 .4 18.2.7 27.5.7 9.4 0 18.7-.2 27.8-.7-9 11.7-18.3 22.4-27.5 32zm-74.4-58.9c-14.2-2.1-27.9-4.7-41-7.9 3.7-12.9 8.3-26.2 13.5-39.5 4.1 8 8.4 16 13.1 24 4.7 8 9.5 15.8 14.4 23.4zM420.7 163c9.3 9.6 18.6 20.3 27.8 32-9-.4-18.2-.7-27.5-.7-9.4 0-18.7.2-27.8.7 9-11.7 18.3-22.4 27.5-32zm-74 58.9c-4.9 7.7-9.8 15.6-14.4 23.7-4.6 8-8.9 16-13 24-5.4-13.4-10-26.8-13.8-39.8 13.1-3.1 26.9-5.8 41.2-7.9zm-90.5 125.2c-35.4-15.1-58.3-34.9-58.3-50.6 0-15.7 22.9-35.6 58.3-50.6 8.6-3.7 18-7 27.7-10.1 5.7 19.6 13.2 40 22.5 60.9-9.2 20.8-16.6 
41.1-22.2 60.6-9.9-3.1-19.3-6.5-28-10.2zM310 490c-13.6-7.8-19.5-37.5-14.9-75.7 1.1-9.4 2.9-19.3 5.1-29.4 19.6 4.8 41 8.5 63.5 10.9 13.5 18.5 27.5 35.3 41.6 50-32.6 30.3-63.2 46.9-84 46.9-4.5-.1-8.3-1-11.3-2.7zm237.2-76.2c4.7 38.2-1.1 67.9-14.6 75.8-3 1.8-6.9 2.6-11.5 2.6-20.7 0-51.4-16.5-84-46.6 14-14.7 28-31.4 41.3-49.9 22.6-2.4 44-6.1 63.6-11 2.3 10.1 4.1 19.8 5.2 29.1zm38.5-66.7c-8.6 3.7-18 7-27.7 10.1-5.7-19.6-13.2-40-22.5-60.9 9.2-20.8 16.6-41.1 22.2-60.6 9.9 3.1 19.3 6.5 28.1 10.2 35.4 15.1 58.3 34.9 58.3 50.6-.1 15.7-23 35.6-58.4 50.6zM320.8 78.4z"/><circle cx="420.9" cy="296.5" r="45.7"/><path d="M520.5 78.1z"/></g></svg>


--------------------------------------------------------------------------------
/chainforge/react-server/src/reportWebVitals.js:
--------------------------------------------------------------------------------
 1 | const reportWebVitals = (onPerfEntry) => {
 2 |   if (onPerfEntry && onPerfEntry instanceof Function) {
 3 |     import("web-vitals").then(({ getCLS, getFID, getFCP, getLCP, getTTFB }) => {
 4 |       getCLS(onPerfEntry);
 5 |       getFID(onPerfEntry);
 6 |       getFCP(onPerfEntry);
 7 |       getLCP(onPerfEntry);
 8 |       getTTFB(onPerfEntry);
 9 |     });
10 |   }
11 | };
12 | 
13 | export default reportWebVitals;
14 | 


--------------------------------------------------------------------------------
/chainforge/react-server/src/setupTests.js:
--------------------------------------------------------------------------------
1 | // jest-dom adds custom jest matchers for asserting on DOM nodes.
2 | // allows you to do things like:
3 | // expect(element).toHaveTextContent(/react/i)
4 | // learn more: https://github.com/testing-library/jest-dom
5 | import "@testing-library/jest-dom";
6 | 


--------------------------------------------------------------------------------
/chainforge/react-server/tsconfig.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "compilerOptions": {
 3 |     "target": "es6",
 4 |     "lib": ["dom", "dom.iterable", "esnext", "WebWorker"],
 5 |     "allowJs": true,
 6 |     "skipLibCheck": true,
 7 |     "esModuleInterop": true,
 8 |     "allowSyntheticDefaultImports": true,
 9 |     "strict": true,
10 |     "forceConsistentCasingInFileNames": false,
11 |     "noFallthroughCasesInSwitch": true,
12 |     "module": "esnext",
13 |     "moduleResolution": "node",
14 |     "resolveJsonModule": true,
15 |     "isolatedModules": true,
16 |     "noEmit": true,
17 |     "typeRoots": ["./node_modules/@types", "./types"],
18 |     "jsx": "react-jsx"
19 |   },
20 |   "include": ["src"]
21 | }
22 | 


--------------------------------------------------------------------------------
/chainforge/requirements.txt:
--------------------------------------------------------------------------------
 1 | flask>=2.2.3
 2 | flask[async]
 3 | flask_cors
 4 | requests
 5 | openai
 6 | urllib3==1.26.6
 7 | mistune>=2.0
 8 | platformdirs
 9 | cryptography
10 | markitdown[pdf, docx, xlsx, xls, pptx]


--------------------------------------------------------------------------------
/chainforge/security/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ianarawjo/ChainForge/0b22ad4e0bc0a18c5675157b1c8ff4b6e57b410d/chainforge/security/__init__.py


--------------------------------------------------------------------------------
/chainforge/security/password_utils.py:
--------------------------------------------------------------------------------
 1 | import os
 2 | import hashlib
 3 | import getpass
 4 | 
 5 | def get_password(prompt="🔐 Enter password: ") -> str:
 6 |   return getpass.getpass(prompt)
 7 | 
 8 | def hash_password(password: str, salt: bytes, iterations=100_000) -> bytes:
 9 |   return hashlib.pbkdf2_hmac('sha256', password.encode(), salt, iterations)
10 | 
11 | def save_password(password: str, hash_filepath: str):
12 |   salt = os.urandom(16)
13 |   hashed = hash_password(password, salt)
14 |   with open(hash_filepath, "wb") as f:
15 |     f.write(salt + hashed)
16 | 
17 | def verify_password(password: str, hash_filepath: str) -> bool:
18 |   with open(hash_filepath, "rb") as f:
19 |     data = f.read()
20 |   salt = data[:16]
21 |   stored_hash = data[16:]
22 |   test_hash = hash_password(password, salt)
23 |   return test_hash == stored_hash
24 | 
25 | def ensure_password(hash_filepath: str, create_new_msg: str = "") -> str:
26 |   if not os.path.exists(hash_filepath):
27 |     # First time setup
28 |     while True:
29 |       if create_new_msg:
30 |         print(create_new_msg)
31 |       pw1 = get_password("Create new password: ")
32 |       pw2 = get_password("Confirm password: ")
33 |       if len(pw1) < 8:
34 |         print("❌ Password must be at least 8 characters long. Try again.")
35 |         continue
36 |       if pw1 != pw2:
37 |         print("❌ Passwords do not match. Try again.")
38 |         continue
39 |       save_password(pw1, hash_filepath)
40 |       print("✅ Password set.")
41 |       return pw1
42 |   else:
43 |     # Verify password
44 |     for _ in range(3):  # Allow 3 tries
45 |       pw = get_password()
46 |       if verify_password(pw, hash_filepath):
47 |         print("✅ Password verified.")
48 |         return pw
49 |       print("❌ Incorrect password.")
50 |     print("Too many failed attempts. Exiting.")
51 |     exit(1)
52 | 


--------------------------------------------------------------------------------
/chainforge/security/secure_save.py:
--------------------------------------------------------------------------------
  1 | import json
  2 | import os
  3 | import base64
  4 | from typing import Union, Tuple
  5 | from cryptography.hazmat.primitives.kdf.pbkdf2 import PBKDF2HMAC
  6 | from cryptography.hazmat.primitives import hashes
  7 | from cryptography.fernet import Fernet
  8 | 
  9 | def generate_key(password: str, salt: bytes) -> bytes:
 10 |   kdf = PBKDF2HMAC(
 11 |     algorithm=hashes.SHA256(),
 12 |     length=32,
 13 |     salt=salt,
 14 |     iterations=100_000,
 15 |   )
 16 |   return base64.urlsafe_b64encode(kdf.derive(password.encode()))
 17 | 
 18 | def load_json_file(filepath_w_ext: str, secure: bool, password: Union[str, None] = None) -> Tuple[Union[dict, None], Union[str, None]]:  
 19 |   """
 20 |     Load a JSON file. If secure is True, load the encrypted file and decrypt it using the provided password.
 21 |     If secure is False, load the plain JSON file.
 22 | 
 23 |     Returns a tuple of (data, filepath) where data is the loaded JSON data and filepath is the true path to the file.
 24 |   """
 25 |   enc_filepath = filepath_w_ext + ".enc"
 26 |   if secure and not os.path.exists(enc_filepath):
 27 |     print(f"❌ Encrypted file not found at path: {enc_filepath}. Looking for non-encrypted file at same path...")
 28 |     secure = False  # Fallback to load a non-encrypted file
 29 | 
 30 |   if not secure:
 31 |     if os.path.exists(filepath_w_ext):
 32 |       with open(filepath_w_ext, "r") as f:
 33 |         return json.load(f), filepath_w_ext
 34 |     print(f"❌ File not found at path: {filepath_w_ext}. Failed to load.")
 35 |     return None, None  # File not found
 36 | 
 37 |   if password is None or len(password) == 0:
 38 |     print("❌ Password is required for secure load. Please provide a password at application start.")
 39 |     return None, None  # Failure
 40 | 
 41 |   if not os.path.exists(enc_filepath):
 42 |     print(f"❌ Encrypted file not found at path: {enc_filepath}. Failed to load.")
 43 |     return None, None
 44 | 
 45 |   try:
 46 |     # Read the combined data (salt + encrypted data) from the file
 47 |     with open(enc_filepath, "rb") as f:
 48 |       combined_data = f.read()
 49 | 
 50 |     # Extract the salt (first 16 bytes) and the encrypted data
 51 |     salt = combined_data[:16]
 52 |     encrypted_data = combined_data[16:]
 53 | 
 54 |     # Generate the key using the password and salt
 55 |     key = generate_key(password, salt)
 56 |     # Create a Fernet object with the key
 57 |     fernet = Fernet(key)
 58 | 
 59 |     # Decrypt the data
 60 |     decrypted = fernet.decrypt(encrypted_data)
 61 |     return json.loads(decrypted), enc_filepath
 62 |   except Exception as e:
 63 |     print(f"❌ Failed to decrypt file: {enc_filepath}. Error: {e}")
 64 |     return None, None
 65 | 
 66 | def save_json_file(data: dict, filepath_w_ext: str, secure: bool, password: Union[str, None] = None) -> bool:
 67 |   """
 68 |     Save `data` to a JSON file. If secure is True, encrypt the file using the provided password.
 69 |     If secure is False, save the plain JSON file.
 70 |   """
 71 |   if not secure:
 72 |     try: 
 73 |       # Save the config to a JSON file
 74 |       with open(filepath_w_ext, "w") as f:
 75 |         json.dump(data, f, indent=2)
 76 |       return True  # Success
 77 |     except Exception as e:
 78 |       print(f"❌ Failed to save file: {filepath_w_ext}. Error: {e}")
 79 |       return False
 80 | 
 81 |   if password is None or len(password) == 0:
 82 |     print("❌ Password is required for secure save. Please provide a password at application start.")
 83 |     return False  # Failure
 84 | 
 85 |   # Filepath for encrypted config as extra .enc extension
 86 |   enc_filepath = filepath_w_ext + ".enc"
 87 | 
 88 |   # Generate a new salt
 89 |   salt = os.urandom(16)
 90 |   # Generate the key using the password and salt
 91 |   key = generate_key(password, salt) 
 92 |   # Create a Fernet object with the key
 93 |   fernet = Fernet(key)
 94 | 
 95 |   try:
 96 |     # Encrypt the data
 97 |     encrypted = fernet.encrypt(json.dumps(data).encode())
 98 |     # Combine the salt and encrypted data
 99 |     combined_data = salt + encrypted
100 |     # Write the combined data to the file
101 |     with open(enc_filepath, "wb") as f:
102 |       f.write(combined_data)
103 |     # If there is an existing unencrypted file at the non-.enc path, delete it.
104 |     # This is to remove the possibility of duplicates. 
105 |     if os.path.exists(filepath_w_ext):
106 |       os.remove(filepath_w_ext)
107 |     return True  # Success
108 |   except Exception as e:
109 |     print(f"❌ Failed to encrypt file: {enc_filepath}. Error: {e}")
110 |     return False
111 | 


--------------------------------------------------------------------------------
/setup.py:
--------------------------------------------------------------------------------
 1 | from setuptools import setup, find_packages
 2 | 
 3 | def readme():
 4 |     with open('README.md', encoding='utf-8') as f:
 5 |         return f.read()
 6 | 
 7 | setup(
 8 |     name="chainforge",
 9 |     version="0.3.6.1",
10 |     packages=find_packages(),
11 |     author="Ian Arawjo",
12 |     description="A Visual Programming Environment for Prompt Engineering",
13 |     long_description=readme(),
14 |     long_description_content_type="text/markdown",
15 |     keywords="prompt engineering LLM response evaluation",
16 |     license="MIT",
17 |     url="https://github.com/ianarawjo/ChainForge/",
18 |     install_requires=[
19 |         # Package dependencies
20 |         "flask>=2.2.3",
21 |         "flask[async]",
22 |         "flask_cors",
23 |         "requests",
24 |         "platformdirs",
25 |         "urllib3==1.26.6",
26 |         "openai",
27 |         "cryptography",
28 |         "mistune>=2.0",  # for LLM response markdown parsing
29 |         "markitdown[pdf, docx, xlsx, xls, pptx]",
30 |     ],
31 |     entry_points={
32 |         "console_scripts": [
33 |             "chainforge = chainforge.app:main",
34 |         ],
35 |     },
36 |     classifiers=[
37 |         # Package classifiers
38 |         "Development Status :: 3 - Alpha",
39 |         "Intended Audience :: Developers",
40 |         "License :: OSI Approved :: MIT License",
41 |         "Programming Language :: Python :: 3",
42 |         "Programming Language :: Python :: 3.10",
43 |         "Programming Language :: Python :: 3.11",
44 |         "Programming Language :: Python :: 3.12",
45 |     ],
46 |     python_requires=">=3.10",
47 |     include_package_data=True,
48 | )
49 | 


--------------------------------------------------------------------------------