├── .gitignore
├── README.md
├── dataset
├── AQuA
│ └── test.json
├── AddSub
│ └── AddSub.json
├── Bigbench_Date
│ └── task.json
├── Bigbench_object_tracking
│ └── task.json
├── CommonsenseQA
│ ├── dev_rand_split.jsonl
│ ├── test_rand_split_no_answers.jsonl
│ └── train_rand_split.jsonl
├── MultiArith
│ └── MultiArith.json
├── SVAMP
│ └── SVAMP.json
├── SingleEq
│ └── questions.json
├── StrategyQA
│ └── task.json
├── coin_flip
│ └── coin_flip.json
├── grade-school-math
│ └── test.jsonl
└── last_letters
│ └── last_letters.json
├── demos
├── addsub_gpt-3.5-turbo-0301
├── addsub_gpt-3.5-turbo-0301_10
├── addsub_gpt-3.5-turbo-0301_11
├── addsub_gpt-3.5-turbo-0301_12
├── addsub_gpt-3.5-turbo-0301_13
├── addsub_gpt-3.5-turbo-0301_14
├── addsub_gpt-3.5-turbo-0301_15
├── addsub_gpt-3.5-turbo-0301_16
├── addsub_gpt-3.5-turbo-0301_17
├── addsub_gpt-3.5-turbo-0301_18
├── addsub_gpt-3.5-turbo-0301_19
├── addsub_gpt-3.5-turbo-0301_20
├── addsub_gpt-3.5-turbo-0301_21
├── addsub_gpt-3.5-turbo-0301_22
├── addsub_gpt-3.5-turbo-0301_23
├── addsub_gpt-3.5-turbo-0301_24
├── addsub_gpt-3.5-turbo-0301_25
├── addsub_gpt-3.5-turbo-0301_26
├── addsub_gpt-3.5-turbo-0301_27
├── addsub_gpt-3.5-turbo-0301_28
├── addsub_gpt-3.5-turbo-0301_29
├── addsub_gpt-3.5-turbo-0301_30
├── addsub_gpt-3.5-turbo-0301_31
├── addsub_gpt-3.5-turbo-0301_32
├── addsub_gpt-3.5-turbo-0301_8
├── addsub_gpt-3.5-turbo-0301_9
├── addsub_manual
├── aqua_gpt-3.5-turbo-0301
├── aqua_gpt-3.5-turbo-0301_10
├── aqua_gpt-3.5-turbo-0301_11
├── aqua_gpt-3.5-turbo-0301_12
├── aqua_gpt-3.5-turbo-0301_13
├── aqua_gpt-3.5-turbo-0301_14
├── aqua_gpt-3.5-turbo-0301_15
├── aqua_gpt-3.5-turbo-0301_16
├── aqua_gpt-3.5-turbo-0301_17
├── aqua_gpt-3.5-turbo-0301_18
├── aqua_gpt-3.5-turbo-0301_19
├── aqua_gpt-3.5-turbo-0301_20
├── aqua_gpt-3.5-turbo-0301_21
├── aqua_gpt-3.5-turbo-0301_22
├── aqua_gpt-3.5-turbo-0301_23
├── aqua_gpt-3.5-turbo-0301_24
├── aqua_gpt-3.5-turbo-0301_25
├── aqua_gpt-3.5-turbo-0301_26
├── aqua_gpt-3.5-turbo-0301_27
├── aqua_gpt-3.5-turbo-0301_28
├── aqua_gpt-3.5-turbo-0301_29
├── aqua_gpt-3.5-turbo-0301_30
├── aqua_gpt-3.5-turbo-0301_31
├── aqua_gpt-3.5-turbo-0301_32
├── aqua_gpt-3.5-turbo-0301_8
├── aqua_gpt-3.5-turbo-0301_9
├── aqua_manual
├── coin_flip_gpt-3.5-turbo-0301
├── coin_flip_gpt-3.5-turbo-0301_10
├── coin_flip_gpt-3.5-turbo-0301_11
├── coin_flip_gpt-3.5-turbo-0301_12
├── coin_flip_gpt-3.5-turbo-0301_13
├── coin_flip_gpt-3.5-turbo-0301_14
├── coin_flip_gpt-3.5-turbo-0301_15
├── coin_flip_gpt-3.5-turbo-0301_16
├── coin_flip_gpt-3.5-turbo-0301_17
├── coin_flip_gpt-3.5-turbo-0301_18
├── coin_flip_gpt-3.5-turbo-0301_19
├── coin_flip_gpt-3.5-turbo-0301_20
├── coin_flip_gpt-3.5-turbo-0301_21
├── coin_flip_gpt-3.5-turbo-0301_22
├── coin_flip_gpt-3.5-turbo-0301_23
├── coin_flip_gpt-3.5-turbo-0301_24
├── coin_flip_gpt-3.5-turbo-0301_25
├── coin_flip_gpt-3.5-turbo-0301_26
├── coin_flip_gpt-3.5-turbo-0301_27
├── coin_flip_gpt-3.5-turbo-0301_28
├── coin_flip_gpt-3.5-turbo-0301_29
├── coin_flip_gpt-3.5-turbo-0301_30
├── coin_flip_gpt-3.5-turbo-0301_31
├── coin_flip_gpt-3.5-turbo-0301_32
├── coin_flip_gpt-3.5-turbo-0301_8
├── coin_flip_gpt-3.5-turbo-0301_9
├── coin_flip_manual
├── commonsensqa_gpt-3.5-turbo-0301
├── commonsensqa_gpt-3.5-turbo-0301_10
├── commonsensqa_gpt-3.5-turbo-0301_11
├── commonsensqa_gpt-3.5-turbo-0301_12
├── commonsensqa_gpt-3.5-turbo-0301_13
├── commonsensqa_gpt-3.5-turbo-0301_14
├── commonsensqa_gpt-3.5-turbo-0301_15
├── commonsensqa_gpt-3.5-turbo-0301_16
├── commonsensqa_gpt-3.5-turbo-0301_17
├── commonsensqa_gpt-3.5-turbo-0301_18
├── commonsensqa_gpt-3.5-turbo-0301_19
├── commonsensqa_gpt-3.5-turbo-0301_20
├── commonsensqa_gpt-3.5-turbo-0301_21
├── commonsensqa_gpt-3.5-turbo-0301_22
├── commonsensqa_gpt-3.5-turbo-0301_23
├── commonsensqa_gpt-3.5-turbo-0301_24
├── commonsensqa_gpt-3.5-turbo-0301_25
├── commonsensqa_gpt-3.5-turbo-0301_26
├── commonsensqa_gpt-3.5-turbo-0301_27
├── commonsensqa_gpt-3.5-turbo-0301_28
├── commonsensqa_gpt-3.5-turbo-0301_29
├── commonsensqa_gpt-3.5-turbo-0301_30
├── commonsensqa_gpt-3.5-turbo-0301_31
├── commonsensqa_gpt-3.5-turbo-0301_32
├── commonsensqa_gpt-3.5-turbo-0301_8
├── commonsensqa_gpt-3.5-turbo-0301_9
├── commonsensqa_manual
├── gsm8k_gpt-3.5-turbo-0301
├── gsm8k_gpt-3.5-turbo-0301_10
├── gsm8k_gpt-3.5-turbo-0301_11
├── gsm8k_gpt-3.5-turbo-0301_12
├── gsm8k_gpt-3.5-turbo-0301_13
├── gsm8k_gpt-3.5-turbo-0301_14
├── gsm8k_gpt-3.5-turbo-0301_15
├── gsm8k_gpt-3.5-turbo-0301_16
├── gsm8k_gpt-3.5-turbo-0301_17
├── gsm8k_gpt-3.5-turbo-0301_18
├── gsm8k_gpt-3.5-turbo-0301_19
├── gsm8k_gpt-3.5-turbo-0301_20
├── gsm8k_gpt-3.5-turbo-0301_21
├── gsm8k_gpt-3.5-turbo-0301_22
├── gsm8k_gpt-3.5-turbo-0301_23
├── gsm8k_gpt-3.5-turbo-0301_24
├── gsm8k_gpt-3.5-turbo-0301_25
├── gsm8k_gpt-3.5-turbo-0301_26
├── gsm8k_gpt-3.5-turbo-0301_27
├── gsm8k_gpt-3.5-turbo-0301_28
├── gsm8k_gpt-3.5-turbo-0301_29
├── gsm8k_gpt-3.5-turbo-0301_30
├── gsm8k_gpt-3.5-turbo-0301_31
├── gsm8k_gpt-3.5-turbo-0301_32
├── gsm8k_gpt-3.5-turbo-0301_8
├── gsm8k_gpt-3.5-turbo-0301_9
├── gsm8k_manual
├── last_letters_gpt-3.5-turbo-0301
├── last_letters_gpt-3.5-turbo-0301_10
├── last_letters_gpt-3.5-turbo-0301_11
├── last_letters_gpt-3.5-turbo-0301_12
├── last_letters_gpt-3.5-turbo-0301_13
├── last_letters_gpt-3.5-turbo-0301_14
├── last_letters_gpt-3.5-turbo-0301_15
├── last_letters_gpt-3.5-turbo-0301_16
├── last_letters_gpt-3.5-turbo-0301_17
├── last_letters_gpt-3.5-turbo-0301_18
├── last_letters_gpt-3.5-turbo-0301_19
├── last_letters_gpt-3.5-turbo-0301_20
├── last_letters_gpt-3.5-turbo-0301_21
├── last_letters_gpt-3.5-turbo-0301_22
├── last_letters_gpt-3.5-turbo-0301_23
├── last_letters_gpt-3.5-turbo-0301_24
├── last_letters_gpt-3.5-turbo-0301_25
├── last_letters_gpt-3.5-turbo-0301_26
├── last_letters_gpt-3.5-turbo-0301_27
├── last_letters_gpt-3.5-turbo-0301_28
├── last_letters_gpt-3.5-turbo-0301_29
├── last_letters_gpt-3.5-turbo-0301_30
├── last_letters_gpt-3.5-turbo-0301_31
├── last_letters_gpt-3.5-turbo-0301_32
├── last_letters_gpt-3.5-turbo-0301_8
├── last_letters_gpt-3.5-turbo-0301_9
├── last_letters_manual
├── multiarith
├── multiarith_auto
├── multiarith_gpt-3.5-turbo-0301
├── multiarith_gpt-3.5-turbo-0301_10
├── multiarith_gpt-3.5-turbo-0301_11
├── multiarith_gpt-3.5-turbo-0301_12
├── multiarith_gpt-3.5-turbo-0301_13
├── multiarith_gpt-3.5-turbo-0301_14
├── multiarith_gpt-3.5-turbo-0301_15
├── multiarith_gpt-3.5-turbo-0301_16
├── multiarith_gpt-3.5-turbo-0301_17
├── multiarith_gpt-3.5-turbo-0301_18
├── multiarith_gpt-3.5-turbo-0301_19
├── multiarith_gpt-3.5-turbo-0301_20
├── multiarith_gpt-3.5-turbo-0301_21
├── multiarith_gpt-3.5-turbo-0301_22
├── multiarith_gpt-3.5-turbo-0301_23
├── multiarith_gpt-3.5-turbo-0301_24
├── multiarith_gpt-3.5-turbo-0301_25
├── multiarith_gpt-3.5-turbo-0301_26
├── multiarith_gpt-3.5-turbo-0301_27
├── multiarith_gpt-3.5-turbo-0301_28
├── multiarith_gpt-3.5-turbo-0301_29
├── multiarith_gpt-3.5-turbo-0301_30
├── multiarith_gpt-3.5-turbo-0301_31
├── multiarith_gpt-3.5-turbo-0301_32
├── multiarith_gpt-3.5-turbo-0301_8
├── multiarith_gpt-3.5-turbo-0301_9
├── multiarith_manual
├── singleeq_gpt-3.5-turbo-0301
├── singleeq_gpt-3.5-turbo-0301_10
├── singleeq_gpt-3.5-turbo-0301_11
├── singleeq_gpt-3.5-turbo-0301_12
├── singleeq_gpt-3.5-turbo-0301_13
├── singleeq_gpt-3.5-turbo-0301_14
├── singleeq_gpt-3.5-turbo-0301_15
├── singleeq_gpt-3.5-turbo-0301_16
├── singleeq_gpt-3.5-turbo-0301_17
├── singleeq_gpt-3.5-turbo-0301_18
├── singleeq_gpt-3.5-turbo-0301_19
├── singleeq_gpt-3.5-turbo-0301_20
├── singleeq_gpt-3.5-turbo-0301_21
├── singleeq_gpt-3.5-turbo-0301_22
├── singleeq_gpt-3.5-turbo-0301_23
├── singleeq_gpt-3.5-turbo-0301_24
├── singleeq_gpt-3.5-turbo-0301_25
├── singleeq_gpt-3.5-turbo-0301_26
├── singleeq_gpt-3.5-turbo-0301_27
├── singleeq_gpt-3.5-turbo-0301_28
├── singleeq_gpt-3.5-turbo-0301_29
├── singleeq_gpt-3.5-turbo-0301_30
├── singleeq_gpt-3.5-turbo-0301_31
├── singleeq_gpt-3.5-turbo-0301_32
├── singleeq_gpt-3.5-turbo-0301_8
├── singleeq_gpt-3.5-turbo-0301_9
├── singleeq_manual
├── strategyqa_gpt-3.5-turbo-0301
├── strategyqa_gpt-3.5-turbo-0301_10
├── strategyqa_gpt-3.5-turbo-0301_11
├── strategyqa_gpt-3.5-turbo-0301_12
├── strategyqa_gpt-3.5-turbo-0301_13
├── strategyqa_gpt-3.5-turbo-0301_14
├── strategyqa_gpt-3.5-turbo-0301_15
├── strategyqa_gpt-3.5-turbo-0301_16
├── strategyqa_gpt-3.5-turbo-0301_17
├── strategyqa_gpt-3.5-turbo-0301_18
├── strategyqa_gpt-3.5-turbo-0301_19
├── strategyqa_gpt-3.5-turbo-0301_20
├── strategyqa_gpt-3.5-turbo-0301_21
├── strategyqa_gpt-3.5-turbo-0301_22
├── strategyqa_gpt-3.5-turbo-0301_23
├── strategyqa_gpt-3.5-turbo-0301_24
├── strategyqa_gpt-3.5-turbo-0301_25
├── strategyqa_gpt-3.5-turbo-0301_26
├── strategyqa_gpt-3.5-turbo-0301_27
├── strategyqa_gpt-3.5-turbo-0301_28
├── strategyqa_gpt-3.5-turbo-0301_29
├── strategyqa_gpt-3.5-turbo-0301_30
├── strategyqa_gpt-3.5-turbo-0301_31
├── strategyqa_gpt-3.5-turbo-0301_32
├── strategyqa_gpt-3.5-turbo-0301_8
├── strategyqa_gpt-3.5-turbo-0301_9
├── strategyqa_manual
├── svamp_gpt-3.5-turbo-0301
├── svamp_gpt-3.5-turbo-0301_10
├── svamp_gpt-3.5-turbo-0301_11
├── svamp_gpt-3.5-turbo-0301_12
├── svamp_gpt-3.5-turbo-0301_13
├── svamp_gpt-3.5-turbo-0301_14
├── svamp_gpt-3.5-turbo-0301_15
├── svamp_gpt-3.5-turbo-0301_16
├── svamp_gpt-3.5-turbo-0301_17
├── svamp_gpt-3.5-turbo-0301_18
├── svamp_gpt-3.5-turbo-0301_19
├── svamp_gpt-3.5-turbo-0301_20
├── svamp_gpt-3.5-turbo-0301_21
├── svamp_gpt-3.5-turbo-0301_22
├── svamp_gpt-3.5-turbo-0301_23
├── svamp_gpt-3.5-turbo-0301_24
├── svamp_gpt-3.5-turbo-0301_25
├── svamp_gpt-3.5-turbo-0301_26
├── svamp_gpt-3.5-turbo-0301_27
├── svamp_gpt-3.5-turbo-0301_28
├── svamp_gpt-3.5-turbo-0301_29
├── svamp_gpt-3.5-turbo-0301_30
├── svamp_gpt-3.5-turbo-0301_31
├── svamp_gpt-3.5-turbo-0301_32
├── svamp_gpt-3.5-turbo-0301_8
├── svamp_gpt-3.5-turbo-0301_9
└── svamp_manual
├── echo.webp
├── log
├── addsub_gpt-3.5-turbo-0301_zero_shot_cot.log
├── aqua_gpt-3.5-turbo-0301_zero_shot_cot.log
├── coin_flip_gpt-3.5-turbo-0301_zero_shot_cot.log
├── commonsensqa_gpt-3.5-turbo-0301_zero_shot_cot.log
├── gsm8k_gpt-3.5-turbo-0301_zero_shot_cot.log
├── last_letters_gpt-3.5-turbo-0301_zero_shot_cot.log
├── multiarith_gpt-3.5-turbo-0301_zero_shot_cot.log
├── singleeq_gpt-3.5-turbo-0301_zero_shot_cot.log
├── strategyqa_gpt-3.5-turbo-0301_zero_shot_cot.log
└── svamp_gpt-3.5-turbo-0301_zero_shot_cot.log
├── run
├── create_demos.sh
├── create_log.sh
├── run_echo.sh
└── run_echo_max.sh
├── run_ECHO.py
├── run_ECHO_max.py
├── run_demo.py
├── run_inference.py
├── run_inference_mistral_api.py
├── run_inference_parallel.py
├── utils.py
└── zero_shot_cot.py
/.gitignore:
--------------------------------------------------------------------------------
1 | # Byte-compiled / optimized / DLL files
2 | __pycache__/
3 | *.py[cod]
4 | *$py.class
5 |
6 | # C extensions
7 | *.so
8 |
9 | # Distribution / packaging
10 | .Python
11 | build/
12 | develop-eggs/
13 | dist/
14 | downloads/
15 | eggs/
16 | .eggs/
17 | lib/
18 | lib64/
19 | parts/
20 | sdist/
21 | var/
22 | wheels/
23 | share/python-wheels/
24 | *.egg-info/
25 | .installed.cfg
26 | *.egg
27 | MANIFEST
28 |
29 | # PyInstaller
30 | # Usually these files are written by a python script from a template
31 | # before PyInstaller builds the exe, so as to inject date/other infos into it.
32 | *.manifest
33 | *.spec
34 |
35 | # Installer logs
36 | pip-log.txt
37 | pip-delete-this-directory.txt
38 |
39 | # Unit test / coverage reports
40 | htmlcov/
41 | .tox/
42 | .nox/
43 | .coverage
44 | .coverage.*
45 | .cache
46 | nosetests.xml
47 | coverage.xml
48 | *.cover
49 | *.py,cover
50 | .hypothesis/
51 | .pytest_cache/
52 | cover/
53 |
54 | # Translations
55 | *.mo
56 | *.pot
57 |
58 | # Django stuff:
59 | local_settings.py
60 | db.sqlite3
61 | db.sqlite3-journal
62 |
63 | # Flask stuff:
64 | instance/
65 | .webassets-cache
66 |
67 | # Scrapy stuff:
68 | .scrapy
69 |
70 | # Sphinx documentation
71 | docs/_build/
72 |
73 | # PyBuilder
74 | .pybuilder/
75 | target/
76 |
77 | # Jupyter Notebook
78 | .ipynb_checkpoints
79 |
80 | # IPython
81 | profile_default/
82 | ipython_config.py
83 |
84 | # pyenv
85 | # For a library or package, you might want to ignore these files since the code is
86 | # intended to run in multiple environments; otherwise, check them in:
87 | # .python-version
88 |
89 | # pipenv
90 | # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
91 | # However, in case of collaboration, if having platform-specific dependencies or dependencies
92 | # having no cross-platform support, pipenv may install dependencies that don't work, or not
93 | # install all needed dependencies.
94 | #Pipfile.lock
95 |
96 | # poetry
97 | # Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
98 | # This is especially recommended for binary packages to ensure reproducibility, and is more
99 | # commonly ignored for libraries.
100 | # https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
101 | #poetry.lock
102 |
103 | # pdm
104 | # Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
105 | #pdm.lock
106 | # pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
107 | # in version control.
108 | # https://pdm.fming.dev/#use-with-ide
109 | .pdm.toml
110 |
111 | # PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
112 | __pypackages__/
113 |
114 | # Celery stuff
115 | celerybeat-schedule
116 | celerybeat.pid
117 |
118 | # SageMath parsed files
119 | *.sage.py
120 |
121 | # Environments
122 | .env
123 | .venv
124 | env/
125 | venv/
126 | ENV/
127 | env.bak/
128 | venv.bak/
129 |
130 | # Spyder project settings
131 | .spyderproject
132 | .spyproject
133 |
134 | # Rope project settings
135 | .ropeproject
136 |
137 | # mkdocs documentation
138 | /site
139 |
140 | # mypy
141 | .mypy_cache/
142 | .dmypy.json
143 | dmypy.json
144 |
145 | # Pyre type checker
146 | .pyre/
147 |
148 | # pytype static type analyzer
149 | .pytype/
150 |
151 | # Cython debug symbols
152 | cython_debug/
153 |
154 | # PyCharm
155 | # JetBrains specific template is maintained in a separate JetBrains.gitignore that can
156 | # be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
157 | # and can be added to the global gitignore or merged into this file. For a more nuclear
158 | # option (not recommended) you can uncomment the following to ignore the entire idea folder.
159 | #.idea/
160 | ECHO_demos/
161 | demos/aqua_gpt-4o_4
162 | demos/gsm8k_gpt-4o_32
163 | demos/gsm8k_gpt-4o_8
164 | experiment/
165 | gpt4o_test.py
166 | run/run_echo_4o.sh
167 | run/run_echo_4oo.sh
--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
1 | # ECHO
2 | Official homepage for "s**E**lf-Harmonized **C**hain of t**HO**ught" https://www.arxiv.org/abs/2409.04057 . (Accepted by NAACL 2025 main)
3 |
4 | [_UPDATE_ **Nov-25-2024** : We added parallel OpenAI inference code that speeds up inference by 20x!!! Simply replace run_inference.py with **run_inference_parallel.py** to use it.]
5 |
6 | [_UPDATE_ Sept-19-2024 : We found that the logs were not uploaded because of a wrong .gitignore; the logs have been re-uploaded, so you can now create your own demonstrations!!! ]
7 |
8 | [_UPDATE_ Sept-16-2024 : We updated the code to work with the latest OpenAI version, as requested in an issue. We also share the logs and demos to save you effort.]
9 |
10 | [_UPDATE_ Feb-16-2024 : First Submission.]
11 |
12 |
13 |

14 |
15 |
16 | ## Get Started
17 |
18 | Please install the latest __openai__ and __torch__
19 |
20 | Set your API:
21 |
22 | ```
23 | export OPENAI_API_KEY=(YOUR OPENAI API KEY)
24 | ```
25 |
26 | Similarly, you should set MISTRAL_API_KEY if you want to use the MISTRAL models.
27 |
28 | ### Step to reproduce main experiment results
29 |
30 | (Optional) **Step 0: Log Creation**
31 |
32 | We have created the log for you using Zero-Shot CoT. This serves as an initialization of our method. If you are using other models, you may consider running this.
33 |
34 | Note that this is not compulsory, as the demo selection will only depend on the question, not the rationale. You can skip this step and directly regenerate the rationale using your model.
35 | ```
36 | source run/create_log.sh
37 | ```
38 |
39 | **Step 1: DEMO creation**
40 |
41 | We follow Auto-CoT to use the clustering, and then select one question from each cluster.
42 | As k=max requires the maximum number of demonstrations allowed by the context length, we generate sets of 8 to 32 demonstrations for each dataset. If you are not running the k=max case, you can generate only 8 demonstrations.
43 |
44 | ```
45 | source run/create_demos.sh
46 | ```
47 |
48 | **Step 2: RUN ECHO~!**
49 |
50 | Now you can run ECHO with
51 | ```
52 | source run/run_echo.sh
53 | ```
54 |
55 | This script creates the demo with ECHO;
56 |
57 | **Step 3: RUN ECHO (k=max)**
58 |
59 | ```
60 | source run/run_echo_max.sh
61 | ```
62 |
63 | This script creates the demo with ECHO (k=max). It iteratively tests the maximum number of demonstrations allowed by the context window size, starting from 32 and going down to 8.
64 |
65 | **Step 4: run inference**
66 |
67 | We attached the inference code after run_echo.sh and run_echo_max.sh
68 | If you want to test Auto-CoT, please use the demo:
69 | ```
70 | demos/{dataset}_{model_name}
71 | ```
72 | If you want to test manual prompt (from Few-shot-CoT), please use the demo:
73 | ```
74 | demos/{dataset}_manual
75 | ```
76 | We suggest **T=4** for optimal performance. However, we found that an easier and less diverse dataset may require fewer iterations.
77 |
78 | You can replace "singleeq" with any other dataset we included: "aqua", "gsm8k", "commonsensqa", "addsub", "multiarith", "strategyqa", "svamp", "singleeq", "coin_flip", "last_letters"
79 |
80 | We also include the code for running inference with the Mistral API.
81 |
82 | If you have any questions, please consider raising an issue or directly emailing Ziqi.
83 |
84 | ## Some Intuition
85 |
86 | There are multiple intuitions which I'd like to share after finishing this paper:
87 |
88 | (1) The unified demonstrations will better match the case in the pre-training data of the model, where contexts from the same piece are mutually relevant and consistent.
89 |
90 | (2) Cognitive Load Theory (by John Sweller): learning is most effective when the cognitive load on working memory is minimized. If all demonstrations are coherent, it is easier for both humans and models to learn and follow the pattern.
91 |
92 | (3) You can also explain this with the Entropy Theory: unified demos reduce the information entropy (disorder and uncertainty), thus increasing the predictability.
93 |
94 | ## Acknowledgement
95 |
96 | This repo is built on repos of Auto-CoT and Zero-shot-CoT.
97 |
98 | ## Citation
99 |
100 | To cite our paper, please include the following bibtex:
101 |
102 | ```
103 | @inproceedings{jin2024selfharmonizedchainthought,
104 | title={Self-Harmonized Chain of Thought},
105 | author={Ziqi Jin and Wei Lu},
106 | booktitle={Proceedings of the NAACL},
107 | year={2025},
108 | url={https://arxiv.org/abs/2409.04057},
109 | }
110 | ```
111 |
--------------------------------------------------------------------------------
/demos/addsub_gpt-3.5-turbo-0301:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Mary found 18 seashells and Jessica found 41 seashells on the beach . How many seashells did they find together ?\nA:",
5 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the number of seashells Mary found to the number of seashells Jessica found. 18 + 41 = 59 So, Mary and Jessica found a total of 59 seashells together.",
6 | "pred_ans": "59",
7 | "gold_ans": "59"
8 | },
9 | {
10 | "question": "Q: Jason grew 23 watermelons and 18 turnips . Nancy grew 28 watermelons . How many watermelons did they grow in total ?\nA:",
11 | "rationale": "Let's think step by step. First, we need to add up the number of watermelons that Jason and Nancy grew. Jason grew 23 watermelons and Nancy grew 28 watermelons, so the total number of watermelons is: 23 + 28 = 51 Therefore, they grew a total of 51 watermelons.",
12 | "pred_ans": "51",
13 | "gold_ans": "51"
14 | },
15 | {
16 | "question": "Q: Sam had 49 pennies and 24 nickels in his bank . His dad gave him 39 nickels and 31 quarters . How many nickels does he have now ?\nA:",
17 | "rationale": "Let's think step by step. First, we need to find out how many total nickels Sam had before his dad gave him more. Sam had 24 nickels to start with, and his dad gave him 39 more nickels. So, Sam now has a total of 24 + 39 = 63 nickels.",
18 | "pred_ans": "63",
19 | "gold_ans": "63"
20 | },
21 | {
22 | "question": "Q: Last week Tim had 12 dollars and Keith had 36 dollars . Tim washed cars over the weekend and now has 75 dollars . How much money did Tim make washing cars ?\nA:",
23 | "rationale": "Let's think step by step. First, we need to find out how much money Tim made by subtracting his initial amount from his final amount. 75 - 12 = 63 This means that Tim made 63 dollars by washing cars over the weekend.",
24 | "pred_ans": "63",
25 | "gold_ans": "63"
26 | },
27 | {
28 | "question": "Q: Kelly bought 0.1 pounds of peanuts and 0.4 pounds of raisins . How many pounds of snacks did she buy in all ?\nA:",
29 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the weight of peanuts and raisins to find the total weight of snacks. 0.1 pounds (peanuts) + 0.4 pounds (raisins) = 0.5 pounds Therefore, Kelly bought 0.5 pounds of snacks in all.",
30 | "pred_ans": "0.5",
31 | "gold_ans": "0.5"
32 | },
33 | {
34 | "question": "Q: Sam has 86 yellow and 20 green marbles . Joan took 25 of Sam 's yellow marbles . How many yellow marbles does Sam now have ?\nA:",
35 | "rationale": "Let's think step by step. First, we need to subtract the 25 yellow marbles that Joan took from Sam's original 86 yellow marbles. 86 - 25 = 61 So Sam now has 61 yellow marbles.",
36 | "pred_ans": "61",
37 | "gold_ans": "61"
38 | },
39 | {
40 | "question": "Q: There are 34 dogwood trees currently in the park . Park workers will plant 49 dogwood trees today . How many dogwood trees will the park have when the workers are finished ?\nA:",
41 | "rationale": "Let's think step by step. First, we need to add the number of dogwood trees currently in the park to the number of trees that will be planted today. So, we can write it as: 34 (current trees) + 49 (newly planted trees) = 83 Therefore, the park will have 83 dogwood trees when the workers are finished planting.",
42 | "pred_ans": "83",
43 | "gold_ans": "83"
44 | },
45 | {
46 | "question": "Q: There are 33 pencils and 44 crayons in the drawer . Joan placed 27 pencils in the drawer . How many pencils are now there in total ?\nA:",
47 | "rationale": "Let's think step by step. First, we need to add the number of pencils that were already in the drawer (33) to the number of pencils Joan placed in the drawer (27). 33 + 27 = 60 So there are now 60 pencils in the drawer.",
48 | "pred_ans": "60",
49 | "gold_ans": "60"
50 | }
51 | ]
52 | }
--------------------------------------------------------------------------------
/demos/addsub_gpt-3.5-turbo-0301_10:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: There are 34 dogwood trees currently in the park . Park workers will plant 49 dogwood trees today . How many dogwood trees will the park have when the workers are finished ?\nA:",
5 | "rationale": "Let's think step by step. First, we need to add the number of dogwood trees currently in the park to the number of trees that will be planted today. So, we can write it as: 34 (current trees) + 49 (newly planted trees) = 83 Therefore, the park will have 83 dogwood trees when the workers are finished planting.",
6 | "pred_ans": "83",
7 | "gold_ans": "83"
8 | },
9 | {
10 | "question": "Q: Sam had 49 pennies and 24 nickels in his bank . His dad gave him 39 nickels and 31 quarters . How many nickels does he have now ?\nA:",
11 | "rationale": "Let's think step by step. First, we need to find out how many total nickels Sam had before his dad gave him more. Sam had 24 nickels to start with, and his dad gave him 39 more nickels. So, Sam now has a total of 24 + 39 = 63 nickels.",
12 | "pred_ans": "63",
13 | "gold_ans": "63"
14 | },
15 | {
16 | "question": "Q: Sam has 86 yellow and 20 green marbles . Joan took 25 of Sam 's yellow marbles . How many yellow marbles does Sam now have ?\nA:",
17 | "rationale": "Let's think step by step. First, we need to subtract the 25 yellow marbles that Joan took from Sam's original 86 yellow marbles. 86 - 25 = 61 So Sam now has 61 yellow marbles.",
18 | "pred_ans": "61",
19 | "gold_ans": "61"
20 | },
21 | {
22 | "question": "Q: Kelly bought 0.1 pounds of peanuts and 0.4 pounds of raisins . How many pounds of snacks did she buy in all ?\nA:",
23 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the weight of peanuts and raisins to find the total weight of snacks. 0.1 pounds (peanuts) + 0.4 pounds (raisins) = 0.5 pounds Therefore, Kelly bought 0.5 pounds of snacks in all.",
24 | "pred_ans": "0.5",
25 | "gold_ans": "0.5"
26 | },
27 | {
28 | "question": "Q: Jason grew 23 watermelons and 18 turnips . Nancy grew 28 watermelons . How many watermelons did they grow in total ?\nA:",
29 | "rationale": "Let's think step by step. First, we need to add up the number of watermelons that Jason and Nancy grew. Jason grew 23 watermelons and Nancy grew 28 watermelons, so the total number of watermelons is: 23 + 28 = 51 Therefore, they grew a total of 51 watermelons.",
30 | "pred_ans": "51",
31 | "gold_ans": "51"
32 | },
33 | {
34 | "question": "Q: Mary found 18 seashells and Jessica found 41 seashells on the beach . How many seashells did they find together ?\nA:",
35 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the number of seashells Mary found to the number of seashells Jessica found. 18 + 41 = 59 So, Mary and Jessica found a total of 59 seashells together.",
36 | "pred_ans": "59",
37 | "gold_ans": "59"
38 | },
39 | {
40 | "question": "Q: Last week Tim had 12 dollars and Keith had 36 dollars . Tim washed cars over the weekend and now has 75 dollars . How much money did Tim make washing cars ?\nA:",
41 | "rationale": "Let's think step by step. First, we need to find out how much money Tim made by subtracting his initial amount from his final amount. 75 - 12 = 63 This means that Tim made 63 dollars by washing cars over the weekend.",
42 | "pred_ans": "63",
43 | "gold_ans": "63"
44 | },
45 | {
46 | "question": "Q: Alyssa 's cat had 8 kittens and 8 had spots . She gave 4 to her friends . How many kittens does she now have ?\nA:",
47 | "rationale": "Let's think step by step. Alyssa originally had 8 kittens, and 8 of them had spots. So, she had 8 spotted kittens. Then, she gave 4 of them to her friends. So, she now has 8 - 4 = 4 spotted kittens left. Therefore, Alyssa now has 4 kittens.",
48 | "pred_ans": "4",
49 | "gold_ans": "4"
50 | },
51 | {
52 | "question": "Q: Eve ran 0.7 mile and walked 0.6 mile . How much farther did Eve run than walk ?\nA:",
53 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to find the difference between the distance Eve ran and walked. To do this, we can subtract the distance she walked from the distance she ran: 0.7 miles - 0.6 miles = 0.1 miles Therefore, Eve ran 0.1 miles farther than she walked.",
54 | "pred_ans": "0.1",
55 | "gold_ans": "0.1"
56 | },
57 | {
58 | "question": "Q: There are 33 pencils and 44 crayons in the drawer . Joan placed 27 pencils in the drawer . How many pencils are now there in total ?\nA:",
59 | "rationale": "Let's think step by step. First, we need to add the number of pencils that were already in the drawer (33) to the number of pencils Joan placed in the drawer (27). 33 + 27 = 60 So there are now 60 pencils in the drawer.",
60 | "pred_ans": "60",
61 | "gold_ans": "60"
62 | }
63 | ],
64 | "inertia": 157.30648803710938
65 | }
--------------------------------------------------------------------------------
/demos/addsub_gpt-3.5-turbo-0301_11:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: There are 34 dogwood trees currently in the park . Park workers will plant 49 dogwood trees today . How many dogwood trees will the park have when the workers are finished ?\nA:",
5 | "rationale": "Let's think step by step. First, we need to add the number of dogwood trees currently in the park to the number of trees that will be planted today. So, we can write it as: 34 (current trees) + 49 (newly planted trees) = 83 Therefore, the park will have 83 dogwood trees when the workers are finished planting.",
6 | "pred_ans": "83",
7 | "gold_ans": "83"
8 | },
9 | {
10 | "question": "Q: Last week Tim had 12 dollars and Keith had 36 dollars . Tim washed cars over the weekend and now has 75 dollars . How much money did Tim make washing cars ?\nA:",
11 | "rationale": "Let's think step by step. First, we need to find out how much money Tim made by subtracting his initial amount from his final amount. 75 - 12 = 63 This means that Tim made 63 dollars by washing cars over the weekend.",
12 | "pred_ans": "63",
13 | "gold_ans": "63"
14 | },
15 | {
16 | "question": "Q: Sam had 49 pennies and 24 nickels in his bank . His dad gave him 39 nickels and 31 quarters . How many nickels does he have now ?\nA:",
17 | "rationale": "Let's think step by step. First, we need to find out how many total nickels Sam had before his dad gave him more. Sam had 24 nickels to start with, and his dad gave him 39 more nickels. So, Sam now has a total of 24 + 39 = 63 nickels.",
18 | "pred_ans": "63",
19 | "gold_ans": "63"
20 | },
21 | {
22 | "question": "Q: Eve ran 0.7 mile and walked 0.6 mile . How much farther did Eve run than walk ?\nA:",
23 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to find the difference between the distance Eve ran and walked. To do this, we can subtract the distance she walked from the distance she ran: 0.7 miles - 0.6 miles = 0.1 miles Therefore, Eve ran 0.1 miles farther than she walked.",
24 | "pred_ans": "0.1",
25 | "gold_ans": "0.1"
26 | },
27 | {
28 | "question": "Q: There are 33 pencils and 44 crayons in the drawer . Joan placed 27 pencils in the drawer . How many pencils are now there in total ?\nA:",
29 | "rationale": "Let's think step by step. First, we need to add the number of pencils that were already in the drawer (33) to the number of pencils Joan placed in the drawer (27). 33 + 27 = 60 So there are now 60 pencils in the drawer.",
30 | "pred_ans": "60",
31 | "gold_ans": "60"
32 | },
33 | {
34 | "question": "Q: Melanie had 30 baseball cards , and 9 were torn . Sara bought 18 of Melanie 's baseball cards . How many baseball cards does Melanie have now ?\nA:",
35 | "rationale": "Let's think step by step. First, we need to find out how many baseball cards Melanie has after 9 were torn. Melanie had 30 baseball cards - 9 torn = 21 baseball cards. Next, we need to find out how many baseball cards Melanie has after Sara bought 18 of them. Melanie had 21 baseball cards - 18 bought by Sara = 3 baseball cards. Therefore, Melanie has 3 baseball cards now.",
36 | "pred_ans": "3",
37 | "gold_ans": "12"
38 | },
39 | {
40 | "question": "Q: Sara picked 35 pears and 27 apples from the orchard . She gave 28 pears to Dan . How many pears does Sara have ?\nA:",
41 | "rationale": "Let's think step by step. First, we need to find out how many pears Sara has after giving 28 to Dan. To do this, we can subtract 28 from the original number of pears she picked: 35 pears - 28 pears = 7 pears So after giving 28 pears to Dan, Sara has 7 pears left.",
42 | "pred_ans": "7",
43 | "gold_ans": "7"
44 | },
45 | {
46 | "question": "Q: Joan grew 8 watermelons and 4 turnips . Tom grew 9 watermelons . How many watermelons did they grow in total ?\nA:",
47 | "rationale": "Let's think step by step. First, we need to add up the number of watermelons that Joan and Tom grew. Joan grew 8 watermelons and Tom grew 9 watermelons, so the total number of watermelons is: 8 + 9 = 17 Therefore, Joan and Tom grew a total of 17 watermelons.",
48 | "pred_ans": "17",
49 | "gold_ans": "17"
50 | },
51 | {
52 | "question": "Q: Mary found 18 seashells and Jessica found 41 seashells on the beach . How many seashells did they find together ?\nA:",
53 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the number of seashells Mary found to the number of seashells Jessica found. 18 + 41 = 59 So, Mary and Jessica found a total of 59 seashells together.",
54 | "pred_ans": "59",
55 | "gold_ans": "59"
56 | },
57 | {
58 | "question": "Q: Sam has 16 blue and 25 green balloons . Alyssa has 21 blue balloons . How many blue balloons do they have in all ?\nA:",
59 | "rationale": "Let's think step by step. First, we need to add the number of blue balloons that Sam and Alyssa have. Sam has 16 blue balloons and Alyssa has 21 blue balloons, so the total number of blue balloons is: 16 + 21 = 37 Therefore, Sam and Alyssa have 37 blue balloons in all.",
60 | "pred_ans": "37",
61 | "gold_ans": "37"
62 | },
63 | {
64 | "question": "Q: Kelly bought 0.1 pounds of peanuts and 0.4 pounds of raisins . How many pounds of snacks did she buy in all ?\nA:",
65 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the weight of peanuts and raisins to find the total weight of snacks. 0.1 pounds (peanuts) + 0.4 pounds (raisins) = 0.5 pounds Therefore, Kelly bought 0.5 pounds of snacks in all.",
66 | "pred_ans": "0.5",
67 | "gold_ans": "0.5"
68 | }
69 | ],
70 | "inertia": 154.0363311767578
71 | }
--------------------------------------------------------------------------------
/demos/addsub_gpt-3.5-turbo-0301_8:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Mary found 18 seashells and Jessica found 41 seashells on the beach . How many seashells did they find together ?\nA:",
5 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the number of seashells Mary found to the number of seashells Jessica found. 18 + 41 = 59 So, Mary and Jessica found a total of 59 seashells together.",
6 | "pred_ans": "59",
7 | "gold_ans": "59"
8 | },
9 | {
10 | "question": "Q: Jason grew 23 watermelons and 18 turnips . Nancy grew 28 watermelons . How many watermelons did they grow in total ?\nA:",
11 | "rationale": "Let's think step by step. First, we need to add up the number of watermelons that Jason and Nancy grew. Jason grew 23 watermelons and Nancy grew 28 watermelons, so the total number of watermelons is: 23 + 28 = 51 Therefore, they grew a total of 51 watermelons.",
12 | "pred_ans": "51",
13 | "gold_ans": "51"
14 | },
15 | {
16 | "question": "Q: Sam had 49 pennies and 24 nickels in his bank . His dad gave him 39 nickels and 31 quarters . How many nickels does he have now ?\nA:",
17 | "rationale": "Let's think step by step. First, we need to find out how many total nickels Sam had before his dad gave him more. Sam had 24 nickels to start with, and his dad gave him 39 more nickels. So, Sam now has a total of 24 + 39 = 63 nickels.",
18 | "pred_ans": "63",
19 | "gold_ans": "63"
20 | },
21 | {
22 | "question": "Q: Last week Tim had 12 dollars and Keith had 36 dollars . Tim washed cars over the weekend and now has 75 dollars . How much money did Tim make washing cars ?\nA:",
23 | "rationale": "Let's think step by step. First, we need to find out how much money Tim made by subtracting his initial amount from his final amount. 75 - 12 = 63 This means that Tim made 63 dollars by washing cars over the weekend.",
24 | "pred_ans": "63",
25 | "gold_ans": "63"
26 | },
27 | {
28 | "question": "Q: Kelly bought 0.1 pounds of peanuts and 0.4 pounds of raisins . How many pounds of snacks did she buy in all ?\nA:",
29 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the weight of peanuts and raisins to find the total weight of snacks. 0.1 pounds (peanuts) + 0.4 pounds (raisins) = 0.5 pounds Therefore, Kelly bought 0.5 pounds of snacks in all.",
30 | "pred_ans": "0.5",
31 | "gold_ans": "0.5"
32 | },
33 | {
34 | "question": "Q: Sam has 86 yellow and 20 green marbles . Joan took 25 of Sam 's yellow marbles . How many yellow marbles does Sam now have ?\nA:",
35 | "rationale": "Let's think step by step. First, we need to subtract the 25 yellow marbles that Joan took from Sam's original 86 yellow marbles. 86 - 25 = 61 So Sam now has 61 yellow marbles.",
36 | "pred_ans": "61",
37 | "gold_ans": "61"
38 | },
39 | {
40 | "question": "Q: There are 34 dogwood trees currently in the park . Park workers will plant 49 dogwood trees today . How many dogwood trees will the park have when the workers are finished ?\nA:",
41 | "rationale": "Let's think step by step. First, we need to add the number of dogwood trees currently in the park to the number of trees that will be planted today. So, we can write it as: 34 (current trees) + 49 (newly planted trees) = 83 Therefore, the park will have 83 dogwood trees when the workers are finished planting.",
42 | "pred_ans": "83",
43 | "gold_ans": "83"
44 | },
45 | {
46 | "question": "Q: There are 33 pencils and 44 crayons in the drawer . Joan placed 27 pencils in the drawer . How many pencils are now there in total ?\nA:",
47 | "rationale": "Let's think step by step. First, we need to add the number of pencils that were already in the drawer (33) to the number of pencils Joan placed in the drawer (27). 33 + 27 = 60 So there are now 60 pencils in the drawer.",
48 | "pred_ans": "60",
49 | "gold_ans": "60"
50 | }
51 | ],
52 | "inertia": 163.63787841796875
53 | }
--------------------------------------------------------------------------------
/demos/addsub_gpt-3.5-turbo-0301_9:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Sam has 86 yellow and 20 green marbles . Joan took 25 of Sam 's yellow marbles . How many yellow marbles does Sam now have ?\nA:",
5 | "rationale": "Let's think step by step. First, we need to subtract the 25 yellow marbles that Joan took from Sam's original 86 yellow marbles. 86 - 25 = 61 So Sam now has 61 yellow marbles.",
6 | "pred_ans": "61",
7 | "gold_ans": "61"
8 | },
9 | {
10 | "question": "Q: Mary found 18 seashells and Jessica found 41 seashells on the beach . How many seashells did they find together ?\nA:",
11 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the number of seashells Mary found to the number of seashells Jessica found. 18 + 41 = 59 So, Mary and Jessica found a total of 59 seashells together.",
12 | "pred_ans": "59",
13 | "gold_ans": "59"
14 | },
15 | {
16 | "question": "Q: There are 41 crayons and 26 pencils in the drawer . Sam placed 12 crayons in the drawer . How many crayons are now there in total ?\nA:",
17 | "rationale": "Let's think step by step. First, we need to add the number of crayons that were originally in the drawer (41) with the number of crayons that Sam placed in the drawer (12). 41 + 12 = 53 So there are now 53 crayons in the drawer.",
18 | "pred_ans": "53",
19 | "gold_ans": "53"
20 | },
21 | {
22 | "question": "Q: There are 34 dogwood trees currently in the park . Park workers will plant 49 dogwood trees today . How many dogwood trees will the park have when the workers are finished ?\nA:",
23 | "rationale": "Let's think step by step. First, we need to add the number of dogwood trees currently in the park to the number of trees that will be planted today. So, we can write it as: 34 (current trees) + 49 (newly planted trees) = 83 Therefore, the park will have 83 dogwood trees when the workers are finished planting.",
24 | "pred_ans": "83",
25 | "gold_ans": "83"
26 | },
27 | {
28 | "question": "Q: Kelly bought 0.1 pounds of peanuts and 0.4 pounds of raisins . How many pounds of snacks did she buy in all ?\nA:",
29 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the weight of peanuts and raisins to find the total weight of snacks. 0.1 pounds (peanuts) + 0.4 pounds (raisins) = 0.5 pounds Therefore, Kelly bought 0.5 pounds of snacks in all.",
30 | "pred_ans": "0.5",
31 | "gold_ans": "0.5"
32 | },
33 | {
34 | "question": "Q: Jason grew 23 watermelons and 18 turnips . Nancy grew 28 watermelons . How many watermelons did they grow in total ?\nA:",
35 | "rationale": "Let's think step by step. First, we need to add up the number of watermelons that Jason and Nancy grew. Jason grew 23 watermelons and Nancy grew 28 watermelons, so the total number of watermelons is: 23 + 28 = 51 Therefore, they grew a total of 51 watermelons.",
36 | "pred_ans": "51",
37 | "gold_ans": "51"
38 | },
39 | {
40 | "question": "Q: Eve ran 0.7 mile and walked 0.6 mile . How much farther did Eve run than walk ?\nA:",
41 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to find the difference between the distance Eve ran and walked. To do this, we can subtract the distance she walked from the distance she ran: 0.7 miles - 0.6 miles = 0.1 miles Therefore, Eve ran 0.1 miles farther than she walked.",
42 | "pred_ans": "0.1",
43 | "gold_ans": "0.1"
44 | },
45 | {
46 | "question": "Q: Last week Tim had 12 dollars and Keith had 36 dollars . Tim washed cars over the weekend and now has 75 dollars . How much money did Tim make washing cars ?\nA:",
47 | "rationale": "Let's think step by step. First, we need to find out how much money Tim made by subtracting his initial amount from his final amount. 75 - 12 = 63 This means that Tim made 63 dollars by washing cars over the weekend.",
48 | "pred_ans": "63",
49 | "gold_ans": "63"
50 | },
51 | {
52 | "question": "Q: Sam had 49 pennies and 24 nickels in his bank . His dad gave him 39 nickels and 31 quarters . How many nickels does he have now ?\nA:",
53 | "rationale": "Let's think step by step. First, we need to find out how many total nickels Sam had before his dad gave him more. Sam had 24 nickels to start with, and his dad gave him 39 more nickels. So, Sam now has a total of 24 + 39 = 63 nickels.",
54 | "pred_ans": "63",
55 | "gold_ans": "63"
56 | }
57 | ],
58 | "inertia": 160.9029998779297
59 | }
--------------------------------------------------------------------------------
/demos/addsub_manual:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: There are 15 trees in the grove. Grove workers will plant trees in the grove today. After they are done, there will be 21 trees. How many trees did the grove workers plant today?\nA:",
5 | "rationale": "There are 15 trees originally. Then there were 21 trees after some more were planted. So there must have been 21 - 15 = 6.",
6 | "pred_ans": "6"
7 | },
8 | {
9 | "question": "Q: If there are 3 cars in the parking lot and 2 more cars arrive, how many cars are in the parking lot?\nA:",
10 | "rationale": "There are originally 3 cars. 2 more cars arrive. 3 + 2 = 5.",
11 | "pred_ans": "5"
12 | },
13 | {
14 | "question": "Q: Leah had 32 chocolates and her sister had 42. If they ate 35, how many pieces do they have left in total?\nA:",
15 | "rationale": "Originally, Leah had 32 chocolates. Her sister had 42. So in total they had 32 + 42 = 74. After eating 35, they had 74 - 35 = 39.",
16 | "pred_ans": "39"
17 | },
18 | {
19 | "question": "Q: Jason had 20 lollipops. He gave Denny some lollipops. Now Jason has 12 lollipops. How many lollipops did Jason give to Denny?\nA:",
20 | "rationale": "Jason started with 20 lollipops. Then he had 12 after giving some to Denny. So he gave Denny 20 - 12 = 8.",
21 | "pred_ans": "8"
22 | },
23 | {
24 | "question": "Q: Shawn has five toys. For Christmas, he got two toys each from his mom and dad. How many toys does he have now?\nA:",
25 | "rationale": "Shawn started with 5 toys. If he got 2 toys each from his mom and dad, then that is 4 more toys. 5 + 4 = 9.",
26 | "pred_ans": "9"
27 | },
28 | {
29 | "question": "Q: There were nine computers in the server room. Five more computers were installed each day, from monday to thursday. How many computers are now in the server room?\nA:",
30 | "rationale": "There were originally 9 computers. For each of 4 days, 5 more computers were added. So 5 * 4 = 20 computers were added. 9 + 20 is 29.",
31 | "pred_ans": "29"
32 | },
33 | {
34 | "question": "Q: Michael had 58 golf balls. On tuesday, he lost 23 golf balls. On wednesday, he lost 2 more. How many golf balls did he have at the end of wednesday?\nA:",
35 | "rationale": "Michael started with 58 golf balls. After losing 23 on tuesday, he had 58 - 23 = 35. After losing 2 more, he had 35 - 2 = 33 golf balls.",
36 | "pred_ans": "33"
37 | },
38 | {
39 | "question": "Q: Olivia has $23. She bought five bagels for $3 each. How much money does she have left?\nA:",
40 | "rationale": "Olivia had 23 dollars. 5 bagels for 3 dollars each will be 5 x 3 = 15 dollars. So she has 23 - 15 dollars left. 23 - 15 is 8.",
41 | "pred_ans": "8"
42 | }
43 | ]
44 | }
--------------------------------------------------------------------------------
/demos/aqua_gpt-3.5-turbo-0301:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: If Jill needed to buy 10 bottles of soda for a party in which 8 people attended, how many bottles of soda will she need to buy for a party in which 12 people are attending? Answer Choices: (A) 6 (B) 8 (C) 10 (D) 12 (E) 14\nA:",
5 | "rationale": "Let's think step by step. Sure, let's break it down. First, we know that Jill needed 10 bottles of soda for a party with 8 people. So, on average, each person drank 10/8 = 1.25 bottles of soda. Now, we need to figure out how many bottles of soda Jill will need for a party with 12 people. If each person drinks an average of 1.25 bottles of soda, then for 12 people, Jill will need 12 x 1.25 = 15 bottles of soda. However, the answer choices don't include 15, so we need to round to the nearest option. The closest option is (E) 14, which is only one bottle less than what we calculated. So, the answer is (E) 14.",
6 | "pred_ans": "E",
7 | "gold_ans": "C"
8 | },
9 | {
10 | "question": "Q: Three bells ring at intervals of 36 seconds, 40 seconds and 48 seconds, respectively. They start ringing together at a particular time. When they will ring together again? Answer Choices: (A) After 6 minutes (B) After 12 minutes (C) After 18 minutes (D) After 24 minutes (E) none\nA:",
11 | "rationale": "Let's think step by step. First, we need to find the time it takes for all three bells to ring together. To do this, we need to find the least common multiple (LCM) of 36, 40, and 48. The prime factorization of 36 is 2^2 x 3^2. The prime factorization of 40 is 2^3 x 5. The prime factorization of 48 is 2^4 x 3. To find the LCM, we need to take the highest power of each prime factor that appears in any of the numbers. So the LCM is 2^4 x 3^2 x 5 = 720 seconds.",
12 | "pred_ans": "B",
13 | "gold_ans": "B"
14 | },
15 | {
16 | "question": "Q: A man spends 70% of his income. If his income increases by 20%, then what will be his new expenditure? Answer Choices: (A) 58.3% (B) 62.5% (C) 63.5% (D) 64.5% (E) 65.5%\nA:",
17 | "rationale": "Let's think step by step. First, let's assume the man's income is $100. Then, he spends 70% of it, which is $70. If his income increases by 20%, then his new income will be $120. To find his new expenditure, we need to find 70% of $120, which is $84. Therefore, his new expenditure is $84 out of $120, which is 70%. So the answer is (A) 58.3%.",
18 | "pred_ans": "A",
19 | "gold_ans": "A"
20 | },
21 | {
22 | "question": "Q: A paper is in a square form whose one side is 20 cm. Two semi circles are drawn on its opposites as diameters. If these semi circles are cut down what is the area of the remaining paper? Answer Choices: (A) 8.75 (B) 8.79 (C) 8.75 (D) 8.71 (E) 8.72\nA:",
23 | "rationale": "Let's think step by step. First, we need to find the area of the square paper. The formula for the area of a square is side x side, so the area of the paper is 20 x 20 = 400 cm². Next, we need to find the area of the two semi-circles. The formula for the area of a circle is πr², but since we only have semi-circles, we need to divide the result by 2. The diameter of the semi-circles is 20 cm, so the radius is 10 cm. Therefore, the area of one semi-circle is 1/2 x π x 10² = 50π/2 = 25π cm². The area of two semi-circles is 50π cm². Finally, we need to subtract the area of the two semi-circles from the area of the square paper to find the remaining area. So, the remaining area is 400 - 50π ≈ 8.79 cm².",
24 | "pred_ans": "B",
25 | "gold_ans": "C"
26 | }
27 | ]
28 | }
--------------------------------------------------------------------------------
/demos/aqua_gpt-3.5-turbo-0301_11:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Three bells ring at intervals of 36 seconds, 40 seconds and 48 seconds, respectively. They start ringing together at a particular time. When they will ring together again? Answer Choices: (A) After 6 minutes (B) After 12 minutes (C) After 18 minutes (D) After 24 minutes (E) none\nA:",
5 | "rationale": "Let's think step by step. First, we need to find the time it takes for all three bells to ring together. To do this, we need to find the least common multiple (LCM) of 36, 40, and 48. The prime factorization of 36 is 2^2 x 3^2. The prime factorization of 40 is 2^3 x 5. The prime factorization of 48 is 2^4 x 3. To find the LCM, we need to take the highest power of each prime factor that appears in any of the numbers. So the LCM is 2^4 x 3^2 x 5 = 720 seconds.",
6 | "pred_ans": "B",
7 | "gold_ans": "B"
8 | },
9 | {
10 | "question": "Q: There are ten lime soda bottles on a table in a restaurant. They are to be served among two different groups of customers consisting of 5 members each. How many ways are there to create these 2 groups? Answer Choices: (A) 90 (B) 105 (C) 126 (D) 252 (E) 525\nA:",
11 | "rationale": "Let's think step by step. First, we need to choose 5 bottles out of the 10 for the first group. This can be done in 10 choose 5 ways, which is equal to 252. After the first group has been served, there will be 5 bottles left for the second group. We need to choose 5 bottles out of these 5 for the second group. This can be done in only 1 way. Therefore, the total number of ways to create the 2 groups is 252 x 1 = 252. So the answer is (D) 252.",
12 | "pred_ans": "D",
13 | "gold_ans": "D"
14 | },
15 | {
16 | "question": "Q: If Jill needed to buy 10 bottles of soda for a party in which 8 people attended, how many bottles of soda will she need to buy for a party in which 12 people are attending? Answer Choices: (A) 6 (B) 8 (C) 10 (D) 12 (E) 14\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. First, we know that Jill needed 10 bottles of soda for a party with 8 people. So, on average, each person drank 10/8 = 1.25 bottles of soda. Now, we need to figure out how many bottles of soda Jill will need for a party with 12 people. If each person drinks an average of 1.25 bottles of soda, then for 12 people, Jill will need 12 x 1.25 = 15 bottles of soda. However, the answer choices don't include 15, so we need to round to the nearest option. The closest option is (E) 14, which is only one bottle less than what we calculated. So, the answer is (E) 14.",
18 | "pred_ans": "E",
19 | "gold_ans": "C"
20 | },
21 | {
22 | "question": "Q: A man spends 70% of his income. If his income increases by 20%, then what will be his new expenditure? Answer Choices: (A) 58.3% (B) 62.5% (C) 63.5% (D) 64.5% (E) 65.5%\nA:",
23 | "rationale": "Let's think step by step. First, let's assume the man's income is $100. Then, he spends 70% of it, which is $70. If his income increases by 20%, then his new income will be $120. To find his new expenditure, we need to find 70% of $120, which is $84. Therefore, his new expenditure is $84 out of $120, which is 70%. So the answer is (A) 58.3%.",
24 | "pred_ans": "A",
25 | "gold_ans": "A"
26 | },
27 | {
28 | "question": "Q: What should come in place of the question mark(?) in each of the following questions ?\nA:",
29 | "rationale": "Let's think step by step. First, we need to simplify the left-hand side of the equation: a2 - b2/(a + b)2 = (a + b)(a - b)/(a + b)2 Next, we can cancel out the (a + b) terms in the numerator and denominator: (a - b)/(a + b) This simplifies to (A) (a + b).",
30 | "pred_ans": "A",
31 | "gold_ans": "A"
32 | },
33 | {
34 | "question": "Q: A paper is in a square form whose one side is 20 cm. Two semi circles are drawn on its opposites as diameters. If these semi circles are cut down what is the area of the remaining paper? Answer Choices: (A) 8.75 (B) 8.79 (C) 8.75 (D) 8.71 (E) 8.72\nA:",
35 | "rationale": "Let's think step by step. First, we need to find the area of the square paper. The formula for the area of a square is side x side, so the area of the paper is 20 x 20 = 400 cm². Next, we need to find the area of the two semi-circles. The formula for the area of a circle is πr², but since we only have semi-circles, we need to divide the result by 2. The diameter of the semi-circles is 20 cm, so the radius is 10 cm. Therefore, the area of one semi-circle is 1/2 x π x 10² = 50π/2 = 25π cm². The area of two semi-circles is 50π cm². Finally, we need to subtract the area of the two semi-circles from the area of the square paper to find the remaining area. So, the remaining area is 400 - 50π ≈ 8.79 cm².",
36 | "pred_ans": "B",
37 | "gold_ans": "C"
38 | },
39 | {
40 | "question": "Q: When I was 2 years old, my brother was half my age. Now I am 60 years old, how old is my brother? Answer Choices: (A) A) 59 (B) B) 69 (C) C) 79 (D) D) 89 (E) E) 99\nA:",
41 | "rationale": "Let's think step by step. When you were 2 years old, your brother was half your age, which means he was 1 year old. Now you are 60 years old, and since your brother was 1 year younger than you, he is 60 - 1 = 59 years old.",
42 | "pred_ans": "A",
43 | "gold_ans": "A"
44 | }
45 | ],
46 | "inertia": 135.32827758789062
47 | }
--------------------------------------------------------------------------------
/demos/aqua_gpt-3.5-turbo-0301_8:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: When I was 2 years old, my brother was half my age. Now I am 60 years old, how old is my brother? Answer Choices: (A) A) 59 (B) B) 69 (C) C) 79 (D) D) 89 (E) E) 99\nA:",
5 | "rationale": "Let's think step by step. When you were 2 years old, your brother was half your age, which means he was 1 year old. Now you are 60 years old, and since your brother was 1 year younger than you, he is 60 - 1 = 59 years old.",
6 | "pred_ans": "A",
7 | "gold_ans": "A"
8 | },
9 | {
10 | "question": "Q: If 120 is reduced to 96, what is the reduction percent? Answer Choices: (A) 30% (B) 40% (C) 20% (D) 10% (E) 5%\nA:",
11 | "rationale": "Let's think step by step. First, we need to find the difference between the original value and the reduced value: 120 - 96 = 24 Next, we need to find what percentage of the original value the difference represents: (24/120) x 100% = 20% Therefore, the reduction percent is 20%, which corresponds to answer choice (C).",
12 | "pred_ans": "C",
13 | "gold_ans": "C"
14 | },
15 | {
16 | "question": "Q: A man spends 70% of his income. If his income increases by 20%, then what will be his new expenditure? Answer Choices: (A) 58.3% (B) 62.5% (C) 63.5% (D) 64.5% (E) 65.5%\nA:",
17 | "rationale": "Let's think step by step. First, let's assume the man's income is $100. Then, he spends 70% of it, which is $70. If his income increases by 20%, then his new income will be $120. To find his new expenditure, we need to find 70% of $120, which is $84. Therefore, his new expenditure is $84 out of $120, which is 70%. So the answer is (A) 58.3%.",
18 | "pred_ans": "A",
19 | "gold_ans": "A"
20 | },
21 | {
22 | "question": "Q: Three bells ring at intervals of 36 seconds, 40 seconds and 48 seconds, respectively. They start ringing together at a particular time. When they will ring together again? Answer Choices: (A) After 6 minutes (B) After 12 minutes (C) After 18 minutes (D) After 24 minutes (E) none\nA:",
23 | "rationale": "Let's think step by step. First, we need to find the time it takes for all three bells to ring together. To do this, we need to find the least common multiple (LCM) of 36, 40, and 48. The prime factorization of 36 is 2^2 x 3^2. The prime factorization of 40 is 2^3 x 5. The prime factorization of 48 is 2^4 x 3. To find the LCM, we need to take the highest power of each prime factor that appears in any of the numbers. So the LCM is 2^4 x 3^2 x 5 = 720 seconds.",
24 | "pred_ans": "B",
25 | "gold_ans": "B"
26 | },
27 | {
28 | "question": "Q: A paper is in a square form whose one side is 20 cm. Two semi circles are drawn on its opposites as diameters. If these semi circles are cut down what is the area of the remaining paper? Answer Choices: (A) 8.75 (B) 8.79 (C) 8.75 (D) 8.71 (E) 8.72\nA:",
29 | "rationale": "Let's think step by step. First, we need to find the area of the square paper. The formula for the area of a square is side x side, so the area of the paper is 20 x 20 = 400 cm². Next, we need to find the area of the two semi-circles. The formula for the area of a circle is πr², but since we only have semi-circles, we need to divide the result by 2. The diameter of the semi-circles is 20 cm, so the radius is 10 cm. Therefore, the area of one semi-circle is 1/2 x π x 10² = 50π/2 = 25π cm². The area of two semi-circles is 50π cm². Finally, we need to subtract the area of the two semi-circles from the area of the square paper to find the remaining area. So, the remaining area is 400 - 50π ≈ 8.79 cm².",
30 | "pred_ans": "B",
31 | "gold_ans": "C"
32 | },
33 | {
34 | "question": "Q: What is the units digit of 9^3-7? Answer Choices: (A) 1 (B) 3 (C) 5 (D) 2 (E) 4\nA:",
35 | "rationale": "Let's think step by step. Sure! We can start by finding the units digit of $9^3$. The units digit of $9^1$ is 9, the units digit of $9^2$ is 1, and the units digit of $9^3$ is 9. So, $9^3$ has a units digit of 9. Next, we subtract 7 from $9^3$. Since 9 minus 7 is 2, the units digit of $9^3-7$ is $\\boxed{\\textbf{(D)}\\ 2}$.",
36 | "pred_ans": "D",
37 | "gold_ans": "D"
38 | },
39 | {
40 | "question": "Q: M men agree to purchase a gift for Rs. D. If 3 men drop out how much more will each have to contribute towards the purchase of the gift? Answer Choices: (A) D/ (M-3) (B) MD/3 (C) M/ (D-3) (D) 3D/ (M2-3M) (E) None of these\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break down the problem. We know that initially, M men agreed to purchase a gift for Rs. D. Therefore, each man would have to contribute D/M rupees towards the gift. Now, if 3 men drop out, the total number of men left would be M-3. The total amount of money required to purchase the gift would still be D rupees. Therefore, each man would now have to contribute D/(M-3) rupees towards the gift. So, the answer is (A) D/(M-3).",
42 | "pred_ans": "A",
43 | "gold_ans": "D"
44 | },
45 | {
46 | "question": "Q: There are ten lime soda bottles on a table in a restaurant. They are to be served among two different groups of customers consisting of 5 members each. How many ways are there to create these 2 groups? Answer Choices: (A) 90 (B) 105 (C) 126 (D) 252 (E) 525\nA:",
47 | "rationale": "Let's think step by step. First, we need to choose 5 bottles out of the 10 for the first group. This can be done in 10 choose 5 ways, which is equal to 252. After the first group has been served, there will be 5 bottles left for the second group. We need to choose 5 bottles out of these 5 for the second group. This can be done in only 1 way. Therefore, the total number of ways to create the 2 groups is 252 x 1 = 252. So the answer is (D) 252.",
48 | "pred_ans": "D",
49 | "gold_ans": "D"
50 | }
51 | ],
52 | "inertia": 139.77273559570312
53 | }
--------------------------------------------------------------------------------
/demos/aqua_gpt-3.5-turbo-0301_9:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Three bells ring at intervals of 36 seconds, 40 seconds and 48 seconds, respectively. They start ringing together at a particular time. When they will ring together again? Answer Choices: (A) After 6 minutes (B) After 12 minutes (C) After 18 minutes (D) After 24 minutes (E) none\nA:",
5 | "rationale": "Let's think step by step. First, we need to find the time it takes for all three bells to ring together. To do this, we need to find the least common multiple (LCM) of 36, 40, and 48. The prime factorization of 36 is 2^2 x 3^2. The prime factorization of 40 is 2^3 x 5. The prime factorization of 48 is 2^4 x 3. To find the LCM, we need to take the highest power of each prime factor that appears in any of the numbers. So the LCM is 2^4 x 3^2 x 5 = 720 seconds.",
6 | "pred_ans": "B",
7 | "gold_ans": "B"
8 | },
9 | {
10 | "question": "Q: What is the units digit of 9^3-7? Answer Choices: (A) 1 (B) 3 (C) 5 (D) 2 (E) 4\nA:",
11 | "rationale": "Let's think step by step. Sure! We can start by finding the units digit of $9^3$. The units digit of $9^1$ is 9, the units digit of $9^2$ is 1, and the units digit of $9^3$ is 9. So, $9^3$ has a units digit of 9. Next, we subtract 7 from $9^3$. Since 9 minus 7 is 2, the units digit of $9^3-7$ is $\\boxed{\\textbf{(D)}\\ 2}$.",
12 | "pred_ans": "D",
13 | "gold_ans": "D"
14 | },
15 | {
16 | "question": "Q: A paper is in a square form whose one side is 20 cm. Two semi circles are drawn on its opposites as diameters. If these semi circles are cut down what is the area of the remaining paper? Answer Choices: (A) 8.75 (B) 8.79 (C) 8.75 (D) 8.71 (E) 8.72\nA:",
17 | "rationale": "Let's think step by step. First, we need to find the area of the square paper. The formula for the area of a square is side x side, so the area of the paper is 20 x 20 = 400 cm². Next, we need to find the area of the two semi-circles. The formula for the area of a circle is πr², but since we only have semi-circles, we need to divide the result by 2. The diameter of the semi-circles is 20 cm, so the radius is 10 cm. Therefore, the area of one semi-circle is 1/2 x π x 10² = 50π/2 = 25π cm². The area of two semi-circles is 50π cm². Finally, we need to subtract the area of the two semi-circles from the area of the square paper to find the remaining area. So, the remaining area is 400 - 50π ≈ 8.79 cm².",
18 | "pred_ans": "B",
19 | "gold_ans": "C"
20 | },
21 | {
22 | "question": "Q: If 120 is reduced to 96, what is the reduction percent? Answer Choices: (A) 30% (B) 40% (C) 20% (D) 10% (E) 5%\nA:",
23 | "rationale": "Let's think step by step. First, we need to find the difference between the original value and the reduced value: 120 - 96 = 24 Next, we need to find what percentage of the original value the difference represents: (24/120) x 100% = 20% Therefore, the reduction percent is 20%, which corresponds to answer choice (C).",
24 | "pred_ans": "C",
25 | "gold_ans": "C"
26 | },
27 | {
28 | "question": "Q: There are ten lime soda bottles on a table in a restaurant. They are to be served among two different groups of customers consisting of 5 members each. How many ways are there to create these 2 groups? Answer Choices: (A) 90 (B) 105 (C) 126 (D) 252 (E) 525\nA:",
29 | "rationale": "Let's think step by step. First, we need to choose 5 bottles out of the 10 for the first group. This can be done in 10 choose 5 ways, which is equal to 252. After the first group has been served, there will be 5 bottles left for the second group. We need to choose 5 bottles out of these 5 for the second group. This can be done in only 1 way. Therefore, the total number of ways to create the 2 groups is 252 x 1 = 252. So the answer is (D) 252.",
30 | "pred_ans": "D",
31 | "gold_ans": "D"
32 | },
33 | {
34 | "question": "Q: A man spends 70% of his income. If his income increases by 20%, then what will be his new expenditure? Answer Choices: (A) 58.3% (B) 62.5% (C) 63.5% (D) 64.5% (E) 65.5%\nA:",
35 | "rationale": "Let's think step by step. First, let's assume the man's income is $100. Then, he spends 70% of it, which is $70. If his income increases by 20%, then his new income will be $120. To find his new expenditure, we need to find 70% of $120, which is $84. Therefore, his new expenditure is $84 out of $120, which is 70%. So the answer is (A) 58.3%.",
36 | "pred_ans": "A",
37 | "gold_ans": "A"
38 | },
39 | {
40 | "question": "Q: When I was 2 years old, my brother was half my age. Now I am 60 years old, how old is my brother? Answer Choices: (A) A) 59 (B) B) 69 (C) C) 79 (D) D) 89 (E) E) 99\nA:",
41 | "rationale": "Let's think step by step. When you were 2 years old, your brother was half your age, which means he was 1 year old. Now you are 60 years old, and since your brother was 1 year younger than you, he is 60 - 1 = 59 years old.",
42 | "pred_ans": "A",
43 | "gold_ans": "A"
44 | }
45 | ],
46 | "inertia": 138.06207275390625
47 | }
--------------------------------------------------------------------------------
/demos/aqua_manual:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: John found that the average of 15 numbers is 40. If 10 is added to each number then the mean of the numbers is? Answer Choices: (A) 50 (B) 45 (C) 65 (D) 78 (E) 64\nA:",
5 | "rationale": "If 10 is added to each number, then the mean of the numbers also increases by 10. So the new mean would be 50. The answer is (A).",
6 | "pred_ans": "A"
7 | },
8 | {
9 | "question": "Q: If a / b = 3/4 and 8a + 5b = 22,then find the value of a. Answer Choices: (A) 1/2 (B) 3/2 (C) 5/2 (D) 4/2 (E) 7/2\nA:",
10 | "rationale": "If a / b = 3/4, then b = 4a / 3. So 8a + 5(4a / 3) = 22. This simplifies to 8a + 20a / 3 = 22, which means 44a / 3 = 22. So a is equal to 3/2. The answer is (B).",
11 | "pred_ans": "B"
12 | },
13 | {
14 | "question": "Q: A person is traveling at 20 km/hr and reached his destiny in 2.5 hr then find the distance? Answer Choices: (A) 53 km (B) 55 km (C) 52 km (D) 60 km (E) 50 km\nA:",
15 | "rationale": "The distance that the person traveled would have been 20 km/hr * 2.5 hrs = 50 km. The answer is (E).",
16 | "pred_ans": "E"
17 | },
18 | {
19 | "question": "Q: How many keystrokes are needed to type the numbers from 1 to 500? Answer Choices: (A) 1156 (B) 1392 (C) 1480 (D) 1562 (E) 1788\nA:",
20 | "rationale": "There are 9 one-digit numbers from 1 to 9. There are 90 two-digit numbers from 10 to 99. There are 401 three-digit numbers from 100 to 500. 9 + 90(2) + 401(3) = 1392. The answer is (B).",
21 | "pred_ans": "B"
22 | }
23 | ]
24 | }
--------------------------------------------------------------------------------
/demos/coin_flip_gpt-3.5-turbo-0301:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: A coin is heads up. Len does not flip the coin. Marquis flips the coin. Kylie flips the coin. Sandra flips the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
5 | "rationale": "Let's think step by step. Initially, the coin is heads up. Marquis flips the coin, which means he reverses it. So now the coin is tails up. Kylie flips the coin, which means she also reverses it. Since the coin was tails up, it is now heads up again. Sandra flips the coin, which means she reverses it. Since the coin was heads up, it is now tails up. So, after all three people have flipped the coin, it is tails up.",
6 | "pred_ans": "no",
7 | "gold_ans": "no"
8 | },
9 | {
10 | "question": "Q: A coin is heads up. Pancho flips the coin. Claudio flips the coin. Elaine does not flip the coin. Vicky does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
11 | "rationale": "Let's think step by step. 1. The coin is heads up. 2. Pancho flips the coin, which means it is now tails up. 3. Claudio flips the coin again, which means it is now heads up again. 4. Elaine and Vicky do not flip the coin, so it remains heads up. Therefore, the coin is still heads up.",
12 | "pred_ans": "yes",
13 | "gold_ans": "yes"
14 | },
15 | {
16 | "question": "Q: A coin is heads up. Claudia flips the coin. Cole does not flip the coin. Matthew does not flip the coin. Juan Pablo does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
17 | "rationale": "Let's think step by step. Initially, the coin is heads up. Claudia flips the coin, which means she reverses it. So now the coin is tails up. However, Cole, Matthew, and Juan Pablo do not flip the coin, which means they do not reverse it. Therefore, the coin remains tails up.",
18 | "pred_ans": "no",
19 | "gold_ans": "no"
20 | },
21 | {
22 | "question": "Q: A coin is heads up. Daphne does not flip the coin. Lola flips the coin. Joanna does not flip the coin. Sheena does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
23 | "rationale": "Let's think step by step. Initially, the coin is heads up. Daphne does not flip the coin, so it remains heads up. Lola flips the coin, which means it is now tails up. Joanna and Sheena do not flip the coin, so it remains tails up. Therefore, the coin is not still heads up. It is now tails up.",
24 | "pred_ans": "no",
25 | "gold_ans": "no"
26 | },
27 | {
28 | "question": "Q: A coin is heads up. Kristen flips the coin. Herbert flips the coin. Benny does not flip the coin. El does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
29 | "rationale": "Let's think step by step. 1. The coin is initially heads up. 2. Kristen flips the coin, which means she reverses it. So now it is tails up. 3. Herbert flips the coin, which means he also reverses it. So now it is heads up again. 4. Benny and El do not flip the coin, so it remains heads up. Therefore, the coin is still heads up at the end.",
30 | "pred_ans": "yes",
31 | "gold_ans": "yes"
32 | },
33 | {
34 | "question": "Q: A coin is heads up. Carlos does not flip the coin. Jackie does not flip the coin. Callie flips the coin. Caitlin flips the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
35 | "rationale": "Let's think step by step. 1. The coin is heads up. 2. Carlos and Jackie do not flip the coin, so it remains heads up. 3. Callie flips the coin, which means it is now tails up. 4. Caitlin flips the coin again, which means it is now heads up again. So, the final answer is yes, the coin is still heads up.",
36 | "pred_ans": "yes",
37 | "gold_ans": "yes"
38 | },
39 | {
40 | "question": "Q: A coin is heads up. Camilo flips the coin. Becky does not flip the coin. Eliza does not flip the coin. Rebecca does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
41 | "rationale": "Let's think step by step. Initially, the coin is heads up. Camilo flips the coin, which means he reverses it. So now the coin is tails up. However, Becky, Eliza, and Rebecca do not flip the coin, which means they do not change its orientation. Therefore, the coin remains tails up.",
42 | "pred_ans": "no",
43 | "gold_ans": "no"
44 | },
45 | {
46 | "question": "Q: A coin is heads up. Juliet flips the coin. Ricardo does not flip the coin. Tita does not flip the coin. Dianna flips the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
47 | "rationale": "Let's think step by step. Initially, the coin is heads up. Juliet flips the coin, which means she reverses it. So now the coin is tails up. Ricardo and Tita do not flip the coin, so it remains tails up. Finally, Dianna flips the coin, which means she reverses it again. So now the coin is heads up again.",
48 | "pred_ans": "yes",
49 | "gold_ans": "yes"
50 | }
51 | ]
52 | }
--------------------------------------------------------------------------------
/demos/coin_flip_gpt-3.5-turbo-0301_8:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: A coin is heads up. Len does not flip the coin. Marquis flips the coin. Kylie flips the coin. Sandra flips the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
5 | "rationale": "Let's think step by step. Initially, the coin is heads up. Marquis flips the coin, which means he reverses it. So now the coin is tails up. Kylie flips the coin, which means she also reverses it. Since the coin was tails up, it is now heads up again. Sandra flips the coin, which means she reverses it. Since the coin was heads up, it is now tails up. So, after all three people have flipped the coin, it is tails up.",
6 | "pred_ans": "no",
7 | "gold_ans": "no"
8 | },
9 | {
10 | "question": "Q: A coin is heads up. Pancho flips the coin. Claudio flips the coin. Elaine does not flip the coin. Vicky does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
11 | "rationale": "Let's think step by step. 1. The coin is heads up. 2. Pancho flips the coin, which means it is now tails up. 3. Claudio flips the coin again, which means it is now heads up again. 4. Elaine and Vicky do not flip the coin, so it remains heads up. Therefore, the coin is still heads up.",
12 | "pred_ans": "yes",
13 | "gold_ans": "yes"
14 | },
15 | {
16 | "question": "Q: A coin is heads up. Claudia flips the coin. Cole does not flip the coin. Matthew does not flip the coin. Juan Pablo does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
17 | "rationale": "Let's think step by step. Initially, the coin is heads up. Claudia flips the coin, which means she reverses it. So now the coin is tails up. However, Cole, Matthew, and Juan Pablo do not flip the coin, which means they do not reverse it. Therefore, the coin remains tails up.",
18 | "pred_ans": "no",
19 | "gold_ans": "no"
20 | },
21 | {
22 | "question": "Q: A coin is heads up. Daphne does not flip the coin. Lola flips the coin. Joanna does not flip the coin. Sheena does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
23 | "rationale": "Let's think step by step. Initially, the coin is heads up. Daphne does not flip the coin, so it remains heads up. Lola flips the coin, which means it is now tails up. Joanna and Sheena do not flip the coin, so it remains tails up. Therefore, the coin is not still heads up. It is now tails up.",
24 | "pred_ans": "no",
25 | "gold_ans": "no"
26 | },
27 | {
28 | "question": "Q: A coin is heads up. Kristen flips the coin. Herbert flips the coin. Benny does not flip the coin. El does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
29 | "rationale": "Let's think step by step. 1. The coin is initially heads up. 2. Kristen flips the coin, which means she reverses it. So now it is tails up. 3. Herbert flips the coin, which means he also reverses it. So now it is heads up again. 4. Benny and El do not flip the coin, so it remains heads up. Therefore, the coin is still heads up at the end.",
30 | "pred_ans": "yes",
31 | "gold_ans": "yes"
32 | },
33 | {
34 | "question": "Q: A coin is heads up. Carlos does not flip the coin. Jackie does not flip the coin. Callie flips the coin. Caitlin flips the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
35 | "rationale": "Let's think step by step. 1. The coin is heads up. 2. Carlos and Jackie do not flip the coin, so it remains heads up. 3. Callie flips the coin, which means it is now tails up. 4. Caitlin flips the coin again, which means it is now heads up again. So, the final answer is yes, the coin is still heads up.",
36 | "pred_ans": "yes",
37 | "gold_ans": "yes"
38 | },
39 | {
40 | "question": "Q: A coin is heads up. Camilo flips the coin. Becky does not flip the coin. Eliza does not flip the coin. Rebecca does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
41 | "rationale": "Let's think step by step. Initially, the coin is heads up. Camilo flips the coin, which means he reverses it. So now the coin is tails up. However, Becky, Eliza, and Rebecca do not flip the coin, which means they do not change its orientation. Therefore, the coin remains tails up.",
42 | "pred_ans": "no",
43 | "gold_ans": "no"
44 | },
45 | {
46 | "question": "Q: A coin is heads up. Juliet flips the coin. Ricardo does not flip the coin. Tita does not flip the coin. Dianna flips the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
47 | "rationale": "Let's think step by step. Initially, the coin is heads up. Juliet flips the coin, which means she reverses it. So now the coin is tails up. Ricardo and Tita do not flip the coin, so it remains tails up. Finally, Dianna flips the coin, which means she reverses it again. So now the coin is heads up again.",
48 | "pred_ans": "yes",
49 | "gold_ans": "yes"
50 | }
51 | ],
52 | "inertia": 91.1930923461914
53 | }
--------------------------------------------------------------------------------
/demos/coin_flip_gpt-3.5-turbo-0301_9:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: A coin is heads up. Billie does not flip the coin. Paloma does not flip the coin. Tanner does not flip the coin. Raul does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
5 | "rationale": "Let's think step by step. 1. The coin is initially heads up. 2. No one flips the coin, meaning no one reverses it. 3. Therefore, the coin is still heads up. So, yes, the coin is still heads up.",
6 | "pred_ans": "yes",
7 | "gold_ans": "yes"
8 | },
9 | {
10 | "question": "Q: A coin is heads up. Juana does not flip the coin. Chip does not flip the coin. Lila does not flip the coin. Jayme does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
11 | "rationale": "Let's think step by step. First, we know that the coin is heads up. Then, we are told that no one flips the coin, meaning that it is not reversed. Therefore, the coin is still heads up.",
12 | "pred_ans": "yes",
13 | "gold_ans": "yes"
14 | },
15 | {
16 | "question": "Q: A coin is heads up. Claudia flips the coin. Cole does not flip the coin. Matthew does not flip the coin. Juan Pablo does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
17 | "rationale": "Let's think step by step. Initially, the coin is heads up. Claudia flips the coin, which means she reverses it. So now the coin is tails up. However, Cole, Matthew, and Juan Pablo do not flip the coin, which means they do not reverse it. Therefore, the coin remains tails up.",
18 | "pred_ans": "no",
19 | "gold_ans": "no"
20 | },
21 | {
22 | "question": "Q: A coin is heads up. Emilia flips the coin. Jonas flips the coin. Christi does not flip the coin. Sophia does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
23 | "rationale": "Let's think step by step. 1. The coin is initially heads up. 2. Emilia flips the coin, which means it is now tails up. 3. Jonas flips the coin, which means it is now heads up again. 4. Christi and Sophia do not flip the coin, so it remains heads up. Therefore, the coin is still heads up.",
24 | "pred_ans": "yes",
25 | "gold_ans": "yes"
26 | },
27 | {
28 | "question": "Q: A coin is heads up. Carlos does not flip the coin. Jackie does not flip the coin. Callie flips the coin. Caitlin flips the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
29 | "rationale": "Let's think step by step. 1. The coin is heads up. 2. Carlos and Jackie do not flip the coin, so it remains heads up. 3. Callie flips the coin, which means it is now tails up. 4. Caitlin flips the coin again, which means it is now heads up again. So, the final answer is yes, the coin is still heads up.",
30 | "pred_ans": "yes",
31 | "gold_ans": "yes"
32 | },
33 | {
34 | "question": "Q: A coin is heads up. Juliet flips the coin. Ricardo does not flip the coin. Tita does not flip the coin. Dianna flips the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
35 | "rationale": "Let's think step by step. Initially, the coin is heads up. Juliet flips the coin, which means she reverses it. So now the coin is tails up. Ricardo and Tita do not flip the coin, so it remains tails up. Finally, Dianna flips the coin, which means she reverses it again. So now the coin is heads up again.",
36 | "pred_ans": "yes",
37 | "gold_ans": "yes"
38 | },
39 | {
40 | "question": "Q: A coin is heads up. Len does not flip the coin. Marquis flips the coin. Kylie flips the coin. Sandra flips the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
41 | "rationale": "Let's think step by step. Initially, the coin is heads up. Marquis flips the coin, which means he reverses it. So now the coin is tails up. Kylie flips the coin, which means she also reverses it. Since the coin was tails up, it is now heads up again. Sandra flips the coin, which means she reverses it. Since the coin was heads up, it is now tails up. So, after all three people have flipped the coin, it is tails up.",
42 | "pred_ans": "no",
43 | "gold_ans": "no"
44 | },
45 | {
46 | "question": "Q: A coin is heads up. Luisa does not flip the coin. Tatiana does not flip the coin. Drake does not flip the coin. Hillary does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
47 | "rationale": "Let's think step by step. First, we know that the coin is heads up. Then, we are told that no one flips the coin, meaning that it is not reversed. Therefore, the coin is still heads up.",
48 | "pred_ans": "yes",
49 | "gold_ans": "yes"
50 | },
51 | {
52 | "question": "Q: A coin is heads up. Deandre does not flip the coin. Moe does not flip the coin. Jack does not flip the coin. Vanessa does not flip the coin. Is the coin still heads up? Note that \"flip\" here means \"reverse\".\nA:",
53 | "rationale": "Let's think step by step. First, we know that the coin is heads up. Then, we are told that no one flips the coin, meaning that it is not reversed. Therefore, the coin is still heads up.",
54 | "pred_ans": "yes",
55 | "gold_ans": "yes"
56 | }
57 | ],
58 | "inertia": 90.61432647705078
59 | }
--------------------------------------------------------------------------------
/demos/coin_flip_manual:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: A coin is heads up. Ka flips the coin. Sherrie flips the coin. Is the coin still heads up?\nA:",
5 | "rationale": "The coin was flipped by Ka and Sherrie. So the coin was flipped 2 times, which is an even number. The coin started heads up, so after an even number of flips, it will still be heads up. So the answer is yes.",
6 | "pred_ans": "yes"
7 | },
8 | {
9 | "question": "Q: A coin is heads up. Jamey flips the coin. Teressa flips the coin. Is the coin still heads up?\nA:",
10 | "rationale": "The coin was flipped by Jamey and Teressa. So the coin was flipped 2 times, which is an even number. The coin started heads up, so after an even number of flips, it will still be heads up. So the answer is yes.",
11 | "pred_ans": "yes"
12 | },
13 | {
14 | "question": "Q: A coin is heads up. Maybelle flips the coin. Shalonda does not flip the coin. Is the coin still heads up?\nA:",
15 | "rationale": "The coin was flipped by Maybelle. So the coin was flipped 1 time, which is an odd number. The coin started heads up, so after an odd number of flips, it will be tails up. So the answer is no.",
16 | "pred_ans": "no"
17 | },
18 | {
19 | "question": "Q: A coin is heads up. Millicent does not flip the coin. Conception flips the coin. Is the coin still heads up?\nA:",
20 | "rationale": "The coin was flipped by Conception. So the coin was flipped 1 time, which is an odd number. The coin started heads up, so after an odd number of flips, it will be tails up. So the answer is no.",
21 | "pred_ans": "no"
22 | },
23 | {
24 | "question": "Q: A coin is heads up. Sal flips the coin. Raymond does not flip the coin. Is the coin still heads up?\nA:",
25 | "rationale": "The coin was flipped by Sal. So the coin was flipped 1 time, which is an odd number. The coin started heads up, so after an odd number of flips, it will be tails up. So the answer is no.",
26 | "pred_ans": "no"
27 | },
28 | {
29 | "question": "Q: A coin is heads up. Conception flips the coin. Kristian does not flip the coin. Is the coin still heads up?\nA:",
30 | "rationale": "The coin was flipped by Conception. So the coin was flipped 1 time, which is an odd number. The coin started heads up, so after an odd number of flips, it will be tails up. So the answer is no.",
31 | "pred_ans": "no"
32 | },
33 | {
34 | "question": "Q: A coin is heads up. Inga does not flip the coin. Elanor does not flip the coin. Is the coin still heads up?\nA:",
35 | "rationale": "The coin was flipped by no one. So the coin was flipped 0 times. The coin started heads up, and it was not flipped, so it is still heads up. So the answer is yes.",
36 | "pred_ans": "yes"
37 | },
38 | {
39 | "question": "Q: A coin is heads up. Ryan flips the coin. Shaunda flips the coin. Is the coin still heads up?\nA:",
40 | "rationale": "The coin was flipped by Ryan and Shaunda. So the coin was flipped 2 times, which is an even number. The coin started heads up, so after an even number of flips, it will still be heads up. So the answer is yes.",
41 | "pred_ans": "yes"
42 | }
43 | ]
44 | }
--------------------------------------------------------------------------------
/demos/commonsensqa_gpt-3.5-turbo-0301:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: If you are hungry and going fishing, why would you be going fishing? Answer Choices: (A) to see the fish (B) have fun (C) catching fish (D) wet clothes (E) killing\nA:",
5 | "rationale": "Let's think step by step. First, we need to understand the purpose of fishing. Fishing is typically done to catch fish for food or sport. So, if someone is hungry and going fishing, it is likely that they are going fishing to catch fish to eat. Therefore, the answer would be (C) catching fish.",
6 | "pred_ans": "C",
7 | "gold_ans": "C"
8 | },
9 | {
10 | "question": "Q: There was many a bottle to choose from behind the cashier where? Answer Choices: (A) grocery store (B) diaper bag (C) gas station (D) liquor store (E) medicine cabinet\nA:",
11 | "rationale": "Let's think step by step. First, we need to understand what the question is asking. The question is asking where there were many bottles to choose from behind the cashier. Next, we can eliminate answer choices that don't make sense. For example, (B) diaper bag and (E) medicine cabinet don't seem like places where there would be many bottles to choose from behind a cashier. We can also use our knowledge and common sense to eliminate answer choices. For example, a grocery store might have many bottles, but they would likely be on the shelves, not behind the cashier. That leaves us with (C) gas station and (D) liquor store. Both of these places could have many bottles behind the cashier. However, based on the context of the question, it seems more likely that the answer is (D) liquor store.",
12 | "pred_ans": "D",
13 | "gold_ans": "D"
14 | },
15 | {
16 | "question": "Q: A farmer sees a weasel in the woods, where is the farmer? Answer Choices: (A) chicken coop (B) beach (C) fairytale (D) great outdoors (E) corn fields\nA:",
17 | "rationale": "Let's think step by step. First, we need to understand the question and the answer choices. The question mentions a farmer seeing a weasel in the woods, and we are given five answer choices: (A) chicken coop, (B) beach, (C) fairytale, (D) great outdoors, and (E) corn fields. Next, we can eliminate answer choices that do not make sense. For example, we can eliminate (B) beach and (C) fairytale because they are not related to the woods or farming. We can also eliminate (A) chicken coop because the question mentions the farmer being in the woods, not in a chicken coop. This leaves us with (D) great outdoors and (E) corn fields. Both of these answer choices are related to farming and being outside, but only (D) great outdoors specifically mentions the woods. Therefore, the correct answer is (D) great outdoors.",
18 | "pred_ans": "D",
19 | "gold_ans": "D"
20 | },
21 | {
22 | "question": "Q: If a person were going to bed, what would be their goal? Answer Choices: (A) lazy (B) insomnia (C) rest (D) falling asleep (E) dreaming of\nA:",
23 | "rationale": "Let's think step by step. When a person goes to bed, their goal is usually to get some rest and fall asleep. So the correct answer would be (C) rest and (D) falling asleep.",
24 | "pred_ans": "C",
25 | "gold_ans": "D"
26 | },
27 | {
28 | "question": "Q: Surprising an angry person could lead to what? Answer Choices: (A) humor (B) fight (C) jocose (D) laughter (E) accidents\nA:",
29 | "rationale": "Let's think step by step. First, we need to understand the meaning of the word \"surprising\" in this context. Surprising someone means doing something unexpected or catching them off guard. Next, we need to consider the emotions of the person being surprised. In this case, they are described as \"angry.\" Based on these two pieces of information, we can eliminate answer choices (A) humor, (C) jocose, and (D) laughter. It is unlikely that someone who is already angry would suddenly find something humorous or start laughing if they were surprised. Answer choice (E) accidents is also unlikely, as it is not directly related to the emotions of the angry person. This leaves us with answer choice (B) fight. If someone is already angry and they are surprised in a way that they perceive as threatening or aggressive, it could escalate into a physical altercation. Therefore, the correct answer is (B) fight.",
30 | "pred_ans": "B",
31 | "gold_ans": "B"
32 | },
33 | {
34 | "question": "Q: Where would you find a ticket booth and see a concert? Answer Choices: (A) clerk (B) indoors (C) movie theater (D) venue (E) auditorium\nA:",
35 | "rationale": "Let's think step by step. First, we need to understand what a ticket booth is. A ticket booth is a small structure or booth where tickets are sold for events such as concerts, movies, or sports games. Next, we need to identify where one would see a concert. Concerts are typically held in specific locations designed for live performances, such as an auditorium or a venue. Therefore, the correct answer is (D) venue.",
36 | "pred_ans": "D",
37 | "gold_ans": "D"
38 | },
39 | {
40 | "question": "Q: His house was a mess, he began doing housework to get what? Answer Choices: (A) boredom (B) nice home (C) michigan (D) feeling satisfied (E) house clean\nA:",
41 | "rationale": "Let's think step by step. The question is asking what the person hoped to achieve by doing housework. We can eliminate options (A) boredom and (C) Michigan as they are not related to the situation. Option (B) a nice home could be a possibility, but it is not specific enough. Option (E) a clean house is definitely a goal of doing housework, but it is not the only one. Therefore, the best answer is (D) feeling satisfied, as it encompasses the idea that the person wanted to improve their living space and feel good about their accomplishment.",
42 | "pred_ans": "D",
43 | "gold_ans": "E"
44 | }
45 | ]
46 | }
--------------------------------------------------------------------------------
/demos/commonsensqa_manual:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: What do people use to absorb extra ink from a fountain pen? Answer Choices: (A) shirt pocket (B) calligrapher’s hand (C) inkwell (D) desk drawer (E) blotter\nA:",
5 | "rationale": "The answer must be an item that can absorb ink. Of the above choices, only blotters are used to absorb ink. So the answer is (E).",
6 | "pred_ans": "E"
7 | },
8 | {
9 | "question": "Q: What home entertainment equipment requires cable? Answer Choices: (A) radio shack (B) substation (C) television (D) cabinet\nA:",
10 | "rationale": "The answer must require cable. Of the above choices, only television requires cable. So the answer is (C).",
11 | "pred_ans": "C"
12 | },
13 | {
14 | "question": "Q: The fox walked from the city into the forest, what was it looking for? Answer Choices: (A) pretty flowers (B) hen house (C) natural habitat (D) storybook\nA:",
15 | "rationale": "The answer must be something in the forest. Of the above choices, only natural habitat is in the forest. So the answer is (C).",
16 | "pred_ans": "C"
17 | },
18 | {
19 | "question": "Q: Sammy wanted to go to where the people were. Where might he go? Answer Choices: (A) populated areas (B) race track (C) desert (D) apartment (E) roadblock\nA:",
20 | "rationale": "The answer must be a place with a lot of people. Of the above choices, only populated areas have a lot of people. So the answer is (A).",
21 | "pred_ans": "A"
22 | },
23 | {
24 | "question": "Q: Where do you put your grapes just before checking out? Answer Choices: (A) mouth (B) grocery cart (C) super market (D) fruit basket (E) fruit market\nA:",
25 | "rationale": "The answer should be the place where grocery items are placed before checking out. Of the above choices, grocery cart makes the most sense for holding grocery items. So the answer is (B).",
26 | "pred_ans": "B"
27 | },
28 | {
29 | "question": "Q: Google Maps and other highway and street GPS services have replaced what? Answer Choices: (A) united states (B) mexico (C) countryside (D) atlas\nA:",
30 | "rationale": "The answer must be something that used to do what Google Maps and GPS services do, which is to give directions. Of the above choices, only atlases are used to give directions. So the answer is (D).",
31 | "pred_ans": "D"
32 | },
33 | {
34 | "question": "Q: Before getting a divorce, what did the wife feel who was doing all the work? Answer Choices: (A) harder (B) anguish (C) bitterness (D) tears (E) sadness\nA:",
35 | "rationale": "The answer should be the feeling of someone getting divorced who was doing all the work. Of the above choices, the closest feeling is bitterness. So the answer is (C).",
36 | "pred_ans": "C"
37 | }
38 | ]
39 | }
--------------------------------------------------------------------------------
/demos/gsm8k_manual:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: There are 15 trees in the grove. Grove workers will plant trees in the grove today. After they are done, there will be 21 trees. How many trees did the grove workers plant today?\nA:",
5 | "rationale": "There are 15 trees originally. Then there were 21 trees after some more were planted. So there must have been 21 - 15 = 6.",
6 | "pred_ans": "6"
7 | },
8 | {
9 | "question": "Q: If there are 3 cars in the parking lot and 2 more cars arrive, how many cars are in the parking lot?\nA:",
10 | "rationale": "There are originally 3 cars. 2 more cars arrive. 3 + 2 = 5.",
11 | "pred_ans": "5"
12 | },
13 | {
14 | "question": "Q: Leah had 32 chocolates and her sister had 42. If they ate 35, how many pieces do they have left in total?\nA:",
15 | "rationale": "Originally, Leah had 32 chocolates. Her sister had 42. So in total they had 32 + 42 = 74. After eating 35, they had 74 - 35 = 39.",
16 | "pred_ans": "39"
17 | },
18 | {
19 | "question": "Q: Jason had 20 lollipops. He gave Denny some lollipops. Now Jason has 12 lollipops. How many lollipops did Jason give to Denny?\nA:",
20 | "rationale": "Jason started with 20 lollipops. Then he had 12 after giving some to Denny. So he gave Denny 20 - 12 = 8.",
21 | "pred_ans": "8"
22 | },
23 | {
24 | "question": "Q: Shawn has five toys. For Christmas, he got two toys each from his mom and dad. How many toys does he have now?\nA:",
25 | "rationale": "Shawn started with 5 toys. If he got 2 toys each from his mom and dad, then that is 4 more toys. 5 + 4 = 9.",
26 | "pred_ans": "9"
27 | },
28 | {
29 | "question": "Q: There were nine computers in the server room. Five more computers were installed each day, from monday to thursday. How many computers are now in the server room?\nA:",
30 | "rationale": "There were originally 9 computers. For each of 4 days, 5 more computers were added. So 5 * 4 = 20 computers were added. 9 + 20 is 29.",
31 | "pred_ans": "29"
32 | },
33 | {
34 | "question": "Q: Michael had 58 golf balls. On tuesday, he lost 23 golf balls. On wednesday, he lost 2 more. How many golf balls did he have at the end of wednesday?\nA:",
35 | "rationale": "Michael started with 58 golf balls. After losing 23 on tuesday, he had 58 - 23 = 35. After losing 2 more, he had 35 - 2 = 33 golf balls.",
36 | "pred_ans": "33"
37 | },
38 | {
39 | "question": "Q: Olivia has $23. She bought five bagels for $3 each. How much money does she have left?\nA:",
40 | "rationale": "Olivia had 23 dollars. 5 bagels for 3 dollars each will be 5 x 3 = 15 dollars. So she has 23 - 15 dollars left. 23 - 15 is 8.",
41 | "pred_ans": "8"
42 | }
43 | ]
44 | }
--------------------------------------------------------------------------------
/demos/last_letters_gpt-3.5-turbo-0301:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Take the last letters of each words in \"Celso Tracy Winston Anton\" and concatenate them.\nA:",
5 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Celso\" is \"o\". The last letter of \"Tracy\" is \"y\". The last letter of \"Winston\" is \"n\". The last letter of \"Anton\" is \"n\". So, if we concatenate these letters, we get \"oynn\".",
6 | "pred_ans": "oynn",
7 | "gold_ans": "oynn"
8 | },
9 | {
10 | "question": "Q: Take the last letters of each words in \"Issa Kendra Ignacio Henry\" and concatenate them.\nA:",
11 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Issa\" is \"a\". The last letter of \"Kendra\" is \"a\". The last letter of \"Ignacio\" is \"o\". The last letter of \"Henry\" is \"y\". So, if we concatenate these letters, we get \"aao y\".",
12 | "pred_ans": "aaoy",
13 | "gold_ans": "aaoy"
14 | },
15 | {
16 | "question": "Q: Take the last letters of each words in \"Marco Antonio Suzette Roland Isabel\" and concatenate them.\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Marco\" is \"o\". The last letter of \"Antonio\" is \"o\". The last letter of \"Suzette\" is \"e\". The last letter of \"Roland\" is \"d\". The last letter of \"Isabel\" is \"l\". So if we concatenate these letters, we get \"oodel\".",
18 | "pred_ans": "oodel",
19 | "gold_ans": "oedl"
20 | },
21 | {
22 | "question": "Q: Take the last letters of each words in \"Elizabeth Mitch Brooke Jordyn\" and concatenate them.\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Elizabeth\" is \"h\". The last letter of \"Mitch\" is \"h\". The last letter of \"Brooke\" is \"e\". The last letter of \"Jordyn\" is \"n\". So, if we concatenate these letters, we get \"hen\".",
24 | "pred_ans": "hen",
25 | "gold_ans": "hhen"
26 | }
27 | ]
28 | }
--------------------------------------------------------------------------------
/demos/last_letters_gpt-3.5-turbo-0301_10:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Take the last letters of each words in \"Malcolm Hussein Franco Hugo\" and concatenate them.\nA:",
5 | "rationale": "Let's think step by step. Sure, let's break it down. The words are: Malcolm, Hussein, Franco, Hugo. We need to take the last letter of each word and concatenate them. So, the last letters are: m, n, o, o. And when we concatenate them, we get: mnoo.",
6 | "pred_ans": "mnoo",
7 | "gold_ans": "mnoo"
8 | },
9 | {
10 | "question": "Q: Take the last letters of each words in \"Sabrina Pete Mary La\" and concatenate them.\nA:",
11 | "rationale": "Let's think step by step. Sure, let's break it down. The given words are: Sabrina, Pete, Mary, La. We need to take the last letter of each word and concatenate them. So, the last letters are: a (from Sabrina), e (from Pete), y (from Mary), a (from La). Now, we can concatenate them to get the final answer: aeya.",
12 | "pred_ans": "aeya",
13 | "gold_ans": "aeya"
14 | },
15 | {
16 | "question": "Q: Take the last letters of each words in \"Issa Kendra Ignacio Henry\" and concatenate them.\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Issa\" is \"a\". The last letter of \"Kendra\" is \"a\". The last letter of \"Ignacio\" is \"o\". The last letter of \"Henry\" is \"y\". So, if we concatenate these letters, we get \"aao y\".",
18 | "pred_ans": "aaoy",
19 | "gold_ans": "aaoy"
20 | },
21 | {
22 | "question": "Q: Take the last letters of each words in \"Les Jun Noe Juliana\" and concatenate them.\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down. First, we need to identify the words in the given phrase: \"Les Jun Noe Juliana\". The words are: Les, Jun, Noe, Juliana. Next, we need to take the last letter of each word. The last letters are: s, n, e, a. Finally, we need to concatenate these letters. So the answer is: snea.",
24 | "pred_ans": "snea",
25 | "gold_ans": "snea"
26 | },
27 | {
28 | "question": "Q: Take the last letters of each words in \"Celso Tracy Winston Anton\" and concatenate them.\nA:",
29 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Celso\" is \"o\". The last letter of \"Tracy\" is \"y\". The last letter of \"Winston\" is \"n\". The last letter of \"Anton\" is \"n\". So, if we concatenate these letters, we get \"oynn\".",
30 | "pred_ans": "oynn",
31 | "gold_ans": "oynn"
32 | },
33 | {
34 | "question": "Q: Take the last letters of each words in \"Mel Josh Alejandra Harley\" and concatenate them.\nA:",
35 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Mel\" is \"l\". The last letter of \"Josh\" is \"h\". The last letter of \"Alejandra\" is \"a\". The last letter of \"Harley\" is \"y\". So if we concatenate these letters, we get \"lhay\".",
36 | "pred_ans": "lhay",
37 | "gold_ans": "lhay"
38 | },
39 | {
40 | "question": "Q: Take the last letters of each words in \"Mari Ximena Leo Antonia\" and concatenate them.\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down. The first step is to identify the words in the given phrase: \"Mari Ximena Leo Antonia\". The words are: Mari, Ximena, Leo, Antonia. The next step is to take the last letter of each word. The last letters are: i, a, o, a. Finally, we concatenate these letters to form a new word. The new word is: \"iaoa\".",
42 | "pred_ans": "iaoa",
43 | "gold_ans": "iaoa"
44 | }
45 | ],
46 | "inertia": 142.83908081054688
47 | }
--------------------------------------------------------------------------------
/demos/last_letters_gpt-3.5-turbo-0301_11:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Take the last letters of each words in \"Marco Antonio Suzette Roland Isabel\" and concatenate them.\nA:",
5 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Marco\" is \"o\". The last letter of \"Antonio\" is \"o\". The last letter of \"Suzette\" is \"e\". The last letter of \"Roland\" is \"d\". The last letter of \"Isabel\" is \"l\". So if we concatenate these letters, we get \"oodel\".",
6 | "pred_ans": "oodel",
7 | "gold_ans": "oedl"
8 | },
9 | {
10 | "question": "Q: Take the last letters of each words in \"Mel Josh Alejandra Harley\" and concatenate them.\nA:",
11 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Mel\" is \"l\". The last letter of \"Josh\" is \"h\". The last letter of \"Alejandra\" is \"a\". The last letter of \"Harley\" is \"y\". So if we concatenate these letters, we get \"lhay\".",
12 | "pred_ans": "lhay",
13 | "gold_ans": "lhay"
14 | },
15 | {
16 | "question": "Q: Take the last letters of each words in \"Malcolm Hussein Franco Hugo\" and concatenate them.\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. The words are: Malcolm, Hussein, Franco, Hugo. We need to take the last letter of each word and concatenate them. So, the last letters are: m, n, o, o. And when we concatenate them, we get: mnoo.",
18 | "pred_ans": "mnoo",
19 | "gold_ans": "mnoo"
20 | },
21 | {
22 | "question": "Q: Take the last letters of each words in \"Elizabeth Mitch Brooke Jordyn\" and concatenate them.\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Elizabeth\" is \"h\". The last letter of \"Mitch\" is \"h\". The last letter of \"Brooke\" is \"e\". The last letter of \"Jordyn\" is \"n\". So, if we concatenate these letters, we get \"hen\".",
24 | "pred_ans": "hen",
25 | "gold_ans": "hhen"
26 | },
27 | {
28 | "question": "Q: Take the last letters of each words in \"Prince Rene Vishal Patrick\" and concatenate them.\nA:",
29 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Prince\" is \"e\". The last letter of \"Rene\" is \"e\". The last letter of \"Vishal\" is \"l\". The last letter of \"Patrick\" is \"k\". So, if we concatenate these letters, we get \"elk\".",
30 | "pred_ans": "elk",
31 | "gold_ans": "eelk"
32 | },
33 | {
34 | "question": "Q: Take the last letters of each words in \"Celso Tracy Winston Anton\" and concatenate them.\nA:",
35 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Celso\" is \"o\". The last letter of \"Tracy\" is \"y\". The last letter of \"Winston\" is \"n\". The last letter of \"Anton\" is \"n\". So, if we concatenate these letters, we get \"oynn\".",
36 | "pred_ans": "oynn",
37 | "gold_ans": "oynn"
38 | },
39 | {
40 | "question": "Q: Take the last letters of each words in \"Sabrina Pete Mary La\" and concatenate them.\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down. The given words are: Sabrina, Pete, Mary, La. We need to take the last letter of each word and concatenate them. So, the last letters are: a (from Sabrina), e (from Pete), y (from Mary), a (from La). Now, we can concatenate them to get the final answer: aeya.",
42 | "pred_ans": "aeya",
43 | "gold_ans": "aeya"
44 | },
45 | {
46 | "question": "Q: Take the last letters of each words in \"Virginia Juanita Zak Wayne\" and concatenate them.\nA:",
47 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Virginia\" is \"a\". The last letter of \"Juanita\" is \"a\". The last letter of \"Zak\" is \"k\". The last letter of \"Wayne\" is \"e\". So, if we concatenate these letters, we get \"ake\".",
48 | "pred_ans": "ake",
49 | "gold_ans": "aake"
50 | },
51 | {
52 | "question": "Q: Take the last letters of each words in \"Martin Sage Tanisha Rick\" and concatenate them.\nA:",
53 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Martin\" is \"n\". The last letter of \"Sage\" is \"e\". The last letter of \"Tanisha\" is \"a\". The last letter of \"Rick\" is \"k\". So, if we concatenate these letters, we get \"neak\".",
54 | "pred_ans": "neak",
55 | "gold_ans": "neak"
56 | }
57 | ],
58 | "inertia": 141.9680938720703
59 | }
--------------------------------------------------------------------------------
/demos/last_letters_gpt-3.5-turbo-0301_12:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Take the last letters of each words in \"Mel Josh Alejandra Harley\" and concatenate them.\nA:",
5 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Mel\" is \"l\". The last letter of \"Josh\" is \"h\". The last letter of \"Alejandra\" is \"a\". The last letter of \"Harley\" is \"y\". So if we concatenate these letters, we get \"lhay\".",
6 | "pred_ans": "lhay",
7 | "gold_ans": "lhay"
8 | },
9 | {
10 | "question": "Q: Take the last letters of each words in \"Russ Berta Mandy Lydia\" and concatenate them.\nA:",
11 | "rationale": "Let's think step by step. Sure, let's break it down. The words are \"Russ Berta Mandy Lydia\". The last letter of \"Russ\" is \"s\". The last letter of \"Berta\" is \"a\". The last letter of \"Mandy\" is \"y\". The last letter of \"Lydia\" is \"a\". So, if we concatenate these letters, we get \"say a\".",
12 | "pred_ans": "saya",
13 | "gold_ans": "saya"
14 | },
15 | {
16 | "question": "Q: Take the last letters of each words in \"Russell Mitchell Bee Faith\" and concatenate them.\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Russell\" is \"l\". The last letter of \"Mitchell\" is \"l\". The last letter of \"Bee\" is \"e\". The last letter of \"Faith\" is \"h\". So, if we concatenate these letters, we get \"lleh\".",
18 | "pred_ans": "lleh",
19 | "gold_ans": "lleh"
20 | },
21 | {
22 | "question": "Q: Take the last letters of each words in \"Celso Tracy Winston Anton\" and concatenate them.\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Celso\" is \"o\". The last letter of \"Tracy\" is \"y\". The last letter of \"Winston\" is \"n\". The last letter of \"Anton\" is \"n\". So, if we concatenate these letters, we get \"oynn\".",
24 | "pred_ans": "oynn",
25 | "gold_ans": "oynn"
26 | },
27 | {
28 | "question": "Q: Take the last letters of each words in \"Kristen Herbert Benny El\" and concatenate them.\nA:",
29 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Kristen\" is \"n\". The last letter of \"Herbert\" is \"t\". The last letter of \"Benny\" is \"y\". The last letter of \"El\" is \"l\". So, if we concatenate these letters, we get \"ntyL\".",
30 | "pred_ans": "ntyL",
31 | "gold_ans": "ntyl"
32 | },
33 | {
34 | "question": "Q: Take the last letters of each words in \"Sabrina Pete Mary La\" and concatenate them.\nA:",
35 | "rationale": "Let's think step by step. Sure, let's break it down. The given words are: Sabrina, Pete, Mary, La. We need to take the last letter of each word and concatenate them. So, the last letters are: a (from Sabrina), e (from Pete), y (from Mary), a (from La). Now, we can concatenate them to get the final answer: aeya.",
36 | "pred_ans": "aeya",
37 | "gold_ans": "aeya"
38 | },
39 | {
40 | "question": "Q: Take the last letters of each words in \"Elizabeth Mitch Brooke Jordyn\" and concatenate them.\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Elizabeth\" is \"h\". The last letter of \"Mitch\" is \"h\". The last letter of \"Brooke\" is \"e\". The last letter of \"Jordyn\" is \"n\". So, if we concatenate these letters, we get \"hen\".",
42 | "pred_ans": "hen",
43 | "gold_ans": "hhen"
44 | },
45 | {
46 | "question": "Q: Take the last letters of each words in \"Marco Antonio Suzette Roland Isabel\" and concatenate them.\nA:",
47 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Marco\" is \"o\". The last letter of \"Antonio\" is \"o\". The last letter of \"Suzette\" is \"e\". The last letter of \"Roland\" is \"d\". The last letter of \"Isabel\" is \"l\". So if we concatenate these letters, we get \"oodel\".",
48 | "pred_ans": "oodel",
49 | "gold_ans": "oedl"
50 | },
51 | {
52 | "question": "Q: Take the last letters of each words in \"Brooklyn Dawn Tay Gene\" and concatenate them.\nA:",
53 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Brooklyn\" is \"n\". The last letter of \"Dawn\" is \"n\". The last letter of \"Tay\" is \"y\". The last letter of \"Gene\" is \"e\". So, if we concatenate these letters, we get \"nyye\".",
54 | "pred_ans": "nyye",
55 | "gold_ans": "nnye"
56 | }
57 | ],
58 | "inertia": 141.0727081298828
59 | }
--------------------------------------------------------------------------------
/demos/last_letters_gpt-3.5-turbo-0301_13:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Take the last letters of each words in \"Brooklyn Dawn Tay Gene\" and concatenate them.\nA:",
5 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Brooklyn\" is \"n\". The last letter of \"Dawn\" is \"n\". The last letter of \"Tay\" is \"y\". The last letter of \"Gene\" is \"e\". So, if we concatenate these letters, we get \"nyye\".",
6 | "pred_ans": "nyye",
7 | "gold_ans": "nnye"
8 | },
9 | {
10 | "question": "Q: Take the last letters of each words in \"Issa Kendra Ignacio Henry\" and concatenate them.\nA:",
11 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Issa\" is \"a\". The last letter of \"Kendra\" is \"a\". The last letter of \"Ignacio\" is \"o\". The last letter of \"Henry\" is \"y\". So, if we concatenate these letters, we get \"aao y\".",
12 | "pred_ans": "aaoy",
13 | "gold_ans": "aaoy"
14 | },
15 | {
16 | "question": "Q: Take the last letters of each words in \"Martin Sage Tanisha Rick\" and concatenate them.\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Martin\" is \"n\". The last letter of \"Sage\" is \"e\". The last letter of \"Tanisha\" is \"a\". The last letter of \"Rick\" is \"k\". So, if we concatenate these letters, we get \"neak\".",
18 | "pred_ans": "neak",
19 | "gold_ans": "neak"
20 | },
21 | {
22 | "question": "Q: Take the last letters of each words in \"Celso Tracy Winston Anton\" and concatenate them.\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Celso\" is \"o\". The last letter of \"Tracy\" is \"y\". The last letter of \"Winston\" is \"n\". The last letter of \"Anton\" is \"n\". So, if we concatenate these letters, we get \"oynn\".",
24 | "pred_ans": "oynn",
25 | "gold_ans": "oynn"
26 | },
27 | {
28 | "question": "Q: Take the last letters of each words in \"Elle Alex Irma Stephan\" and concatenate them.\nA:",
29 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Elle\" is \"e\". The last letter of \"Alex\" is \"x\". The last letter of \"Irma\" is \"a\". The last letter of \"Stephan\" is \"n\". So, if we concatenate these letters, we get \"exan\".",
30 | "pred_ans": "exan",
31 | "gold_ans": "exan"
32 | },
33 | {
34 | "question": "Q: Take the last letters of each words in \"Marco Antonio Suzette Roland Isabel\" and concatenate them.\nA:",
35 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Marco\" is \"o\". The last letter of \"Antonio\" is \"o\". The last letter of \"Suzette\" is \"e\". The last letter of \"Roland\" is \"d\". The last letter of \"Isabel\" is \"l\". So if we concatenate these letters, we get \"oodel\".",
36 | "pred_ans": "oodel",
37 | "gold_ans": "oedl"
38 | },
39 | {
40 | "question": "Q: Take the last letters of each words in \"Elizabeth Mitch Brooke Jordyn\" and concatenate them.\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Elizabeth\" is \"h\". The last letter of \"Mitch\" is \"h\". The last letter of \"Brooke\" is \"e\". The last letter of \"Jordyn\" is \"n\". So, if we concatenate these letters, we get \"hen\".",
42 | "pred_ans": "hen",
43 | "gold_ans": "hhen"
44 | },
45 | {
46 | "question": "Q: Take the last letters of each words in \"Regina Joel Justice Eli\" and concatenate them.\nA:",
47 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Regina\" is \"a\". The last letter of \"Joel\" is \"l\". The last letter of \"Justice\" is \"e\". The last letter of \"Eli\" is \"i\". So, if we concatenate these letters, we get \"alei\".",
48 | "pred_ans": "alei",
49 | "gold_ans": "alei"
50 | }
51 | ],
52 | "inertia": 140.66937255859375
53 | }
--------------------------------------------------------------------------------
/demos/last_letters_gpt-3.5-turbo-0301_15:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Take the last letters of each words in \"Sabrina Pete Mary La\" and concatenate them.\nA:",
5 | "rationale": "Let's think step by step. Sure, let's break it down. The given words are: Sabrina, Pete, Mary, La. We need to take the last letter of each word and concatenate them. So, the last letters are: a (from Sabrina), e (from Pete), y (from Mary), a (from La). Now, we can concatenate them to get the final answer: aeya.",
6 | "pred_ans": "aeya",
7 | "gold_ans": "aeya"
8 | },
9 | {
10 | "question": "Q: Take the last letters of each words in \"Prince Rene Vishal Patrick\" and concatenate them.\nA:",
11 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Prince\" is \"e\". The last letter of \"Rene\" is \"e\". The last letter of \"Vishal\" is \"l\". The last letter of \"Patrick\" is \"k\". So, if we concatenate these letters, we get \"elk\".",
12 | "pred_ans": "elk",
13 | "gold_ans": "eelk"
14 | },
15 | {
16 | "question": "Q: Take the last letters of each words in \"Celso Tracy Winston Anton\" and concatenate them.\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Celso\" is \"o\". The last letter of \"Tracy\" is \"y\". The last letter of \"Winston\" is \"n\". The last letter of \"Anton\" is \"n\". So, if we concatenate these letters, we get \"oynn\".",
18 | "pred_ans": "oynn",
19 | "gold_ans": "oynn"
20 | },
21 | {
22 | "question": "Q: Take the last letters of each words in \"Brooklyn Dawn Tay Gene\" and concatenate them.\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Brooklyn\" is \"n\". The last letter of \"Dawn\" is \"n\". The last letter of \"Tay\" is \"y\". The last letter of \"Gene\" is \"e\". So, if we concatenate these letters, we get \"nyye\".",
24 | "pred_ans": "nyye",
25 | "gold_ans": "nnye"
26 | },
27 | {
28 | "question": "Q: Take the last letters of each words in \"Virginia Juanita Zak Wayne\" and concatenate them.\nA:",
29 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Virginia\" is \"a\". The last letter of \"Juanita\" is \"a\". The last letter of \"Zak\" is \"k\". The last letter of \"Wayne\" is \"e\". So, if we concatenate these letters, we get \"ake\".",
30 | "pred_ans": "ake",
31 | "gold_ans": "aake"
32 | },
33 | {
34 | "question": "Q: Take the last letters of each words in \"Marco Antonio Suzette Roland Isabel\" and concatenate them.\nA:",
35 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Marco\" is \"o\". The last letter of \"Antonio\" is \"o\". The last letter of \"Suzette\" is \"e\". The last letter of \"Roland\" is \"d\". The last letter of \"Isabel\" is \"l\". So if we concatenate these letters, we get \"oodel\".",
36 | "pred_ans": "oodel",
37 | "gold_ans": "oedl"
38 | },
39 | {
40 | "question": "Q: Take the last letters of each words in \"Mari Ximena Leo Antonia\" and concatenate them.\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down. The first step is to identify the words in the given phrase: \"Mari Ximena Leo Antonia\". The words are: Mari, Ximena, Leo, Antonia. The next step is to take the last letter of each word. The last letters are: i, a, o, a. Finally, we concatenate these letters to form a new word. The new word is: \"iaoa\".",
42 | "pred_ans": "iaoa",
43 | "gold_ans": "iaoa"
44 | },
45 | {
46 | "question": "Q: Take the last letters of each words in \"Issa Kendra Ignacio Henry\" and concatenate them.\nA:",
47 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Issa\" is \"a\". The last letter of \"Kendra\" is \"a\". The last letter of \"Ignacio\" is \"o\". The last letter of \"Henry\" is \"y\". So, if we concatenate these letters, we get \"aao y\".",
48 | "pred_ans": "aaoy",
49 | "gold_ans": "aaoy"
50 | },
51 | {
52 | "question": "Q: Take the last letters of each words in \"Elizabeth Mitch Brooke Jordyn\" and concatenate them.\nA:",
53 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Elizabeth\" is \"h\". The last letter of \"Mitch\" is \"h\". The last letter of \"Brooke\" is \"e\". The last letter of \"Jordyn\" is \"n\". So, if we concatenate these letters, we get \"hen\".",
54 | "pred_ans": "hen",
55 | "gold_ans": "hhen"
56 | },
57 | {
58 | "question": "Q: Take the last letters of each words in \"Elle Alex Irma Stephan\" and concatenate them.\nA:",
59 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Elle\" is \"e\". The last letter of \"Alex\" is \"x\". The last letter of \"Irma\" is \"a\". The last letter of \"Stephan\" is \"n\". So, if we concatenate these letters, we get \"exan\".",
60 | "pred_ans": "exan",
61 | "gold_ans": "exan"
62 | },
63 | {
64 | "question": "Q: Take the last letters of each words in \"Memo Joey Phil Samuel\" and concatenate them.\nA:",
65 | "rationale": "Let's think step by step. Sure, let's break it down. The words are: Memo, Joey, Phil, Samuel. To get the last letter of each word, we simply take the letter that appears at the end of each word. So, the last letters are: o, y, l, l. To concatenate them means to join them together in order. So, if we put them together in order, we get: \"oyll\".",
66 | "pred_ans": "oyll",
67 | "gold_ans": "oyll"
68 | }
69 | ],
70 | "inertia": 139.52740478515625
71 | }
--------------------------------------------------------------------------------
/demos/last_letters_gpt-3.5-turbo-0301_17:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Take the last letters of each words in \"Virginia Juanita Zak Wayne\" and concatenate them.\nA:",
5 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Virginia\" is \"a\". The last letter of \"Juanita\" is \"a\". The last letter of \"Zak\" is \"k\". The last letter of \"Wayne\" is \"e\". So, if we concatenate these letters, we get \"ake\".",
6 | "pred_ans": "ake",
7 | "gold_ans": "aake"
8 | },
9 | {
10 | "question": "Q: Take the last letters of each words in \"Mel Josh Alejandra Harley\" and concatenate them.\nA:",
11 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Mel\" is \"l\". The last letter of \"Josh\" is \"h\". The last letter of \"Alejandra\" is \"a\". The last letter of \"Harley\" is \"y\". So if we concatenate these letters, we get \"lhay\".",
12 | "pred_ans": "lhay",
13 | "gold_ans": "lhay"
14 | },
15 | {
16 | "question": "Q: Take the last letters of each words in \"Elizabeth Mitch Brooke Jordyn\" and concatenate them.\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Elizabeth\" is \"h\". The last letter of \"Mitch\" is \"h\". The last letter of \"Brooke\" is \"e\". The last letter of \"Jordyn\" is \"n\". So, if we concatenate these letters, we get \"hen\".",
18 | "pred_ans": "hen",
19 | "gold_ans": "hhen"
20 | },
21 | {
22 | "question": "Q: Take the last letters of each words in \"Malcolm Hussein Franco Hugo\" and concatenate them.\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down. The words are: Malcolm, Hussein, Franco, Hugo. We need to take the last letter of each word and concatenate them. So, the last letters are: m, n, o, o. And when we concatenate them, we get: mnoo.",
24 | "pred_ans": "mnoo",
25 | "gold_ans": "mnoo"
26 | },
27 | {
28 | "question": "Q: Take the last letters of each words in \"Sabrina Pete Mary La\" and concatenate them.\nA:",
29 | "rationale": "Let's think step by step. Sure, let's break it down. The given words are: Sabrina, Pete, Mary, La. We need to take the last letter of each word and concatenate them. So, the last letters are: a (from Sabrina), e (from Pete), y (from Mary), a (from La). Now, we can concatenate them to get the final answer: aeya.",
30 | "pred_ans": "aeya",
31 | "gold_ans": "aeya"
32 | },
33 | {
34 | "question": "Q: Take the last letters of each words in \"Russ Berta Mandy Lydia\" and concatenate them.\nA:",
35 | "rationale": "Let's think step by step. Sure, let's break it down. The words are \"Russ Berta Mandy Lydia\". The last letter of \"Russ\" is \"s\". The last letter of \"Berta\" is \"a\". The last letter of \"Mandy\" is \"y\". The last letter of \"Lydia\" is \"a\". So, if we concatenate these letters, we get \"say a\".",
36 | "pred_ans": "saya",
37 | "gold_ans": "saya"
38 | },
39 | {
40 | "question": "Q: Take the last letters of each words in \"Celso Tracy Winston Anton\" and concatenate them.\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Celso\" is \"o\". The last letter of \"Tracy\" is \"y\". The last letter of \"Winston\" is \"n\". The last letter of \"Anton\" is \"n\". So, if we concatenate these letters, we get \"oynn\".",
42 | "pred_ans": "oynn",
43 | "gold_ans": "oynn"
44 | },
45 | {
46 | "question": "Q: Take the last letters of each words in \"Issa Kendra Ignacio Henry\" and concatenate them.\nA:",
47 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Issa\" is \"a\". The last letter of \"Kendra\" is \"a\". The last letter of \"Ignacio\" is \"o\". The last letter of \"Henry\" is \"y\". So, if we concatenate these letters, we get \"aao y\".",
48 | "pred_ans": "aaoy",
49 | "gold_ans": "aaoy"
50 | },
51 | {
52 | "question": "Q: Take the last letters of each words in \"Marco Antonio Suzette Roland Isabel\" and concatenate them.\nA:",
53 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Marco\" is \"o\". The last letter of \"Antonio\" is \"o\". The last letter of \"Suzette\" is \"e\". The last letter of \"Roland\" is \"d\". The last letter of \"Isabel\" is \"l\". So if we concatenate these letters, we get \"oodel\".",
54 | "pred_ans": "oodel",
55 | "gold_ans": "oedl"
56 | },
57 | {
58 | "question": "Q: Take the last letters of each words in \"Memo Joey Phil Samuel\" and concatenate them.\nA:",
59 | "rationale": "Let's think step by step. Sure, let's break it down. The words are: Memo, Joey, Phil, Samuel. To get the last letter of each word, we simply take the letter that appears at the end of each word. So, the last letters are: o, y, l, l. To concatenate them means to join them together in order. So, if we put them together in order, we get: \"oyll\".",
60 | "pred_ans": "oyll",
61 | "gold_ans": "oyll"
62 | }
63 | ],
64 | "inertia": 138.12693786621094
65 | }
--------------------------------------------------------------------------------
/demos/last_letters_gpt-3.5-turbo-0301_22:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Take the last letters of each words in \"Russ Berta Mandy Lydia\" and concatenate them.\nA:",
5 | "rationale": "Let's think step by step. Sure, let's break it down. The words are \"Russ Berta Mandy Lydia\". The last letter of \"Russ\" is \"s\". The last letter of \"Berta\" is \"a\". The last letter of \"Mandy\" is \"y\". The last letter of \"Lydia\" is \"a\". So, if we concatenate these letters, we get \"say a\".",
6 | "pred_ans": "saya",
7 | "gold_ans": "saya"
8 | },
9 | {
10 | "question": "Q: Take the last letters of each words in \"Marco Antonio Suzette Roland Isabel\" and concatenate them.\nA:",
11 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Marco\" is \"o\". The last letter of \"Antonio\" is \"o\". The last letter of \"Suzette\" is \"e\". The last letter of \"Roland\" is \"d\". The last letter of \"Isabel\" is \"l\". So if we concatenate these letters, we get \"oodel\".",
12 | "pred_ans": "oodel",
13 | "gold_ans": "oedl"
14 | },
15 | {
16 | "question": "Q: Take the last letters of each words in \"Issa Kendra Ignacio Henry\" and concatenate them.\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Issa\" is \"a\". The last letter of \"Kendra\" is \"a\". The last letter of \"Ignacio\" is \"o\". The last letter of \"Henry\" is \"y\". So, if we concatenate these letters, we get \"aao y\".",
18 | "pred_ans": "aaoy",
19 | "gold_ans": "aaoy"
20 | },
21 | {
22 | "question": "Q: Take the last letters of each words in \"Kristen Herbert Benny El\" and concatenate them.\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Kristen\" is \"n\". The last letter of \"Herbert\" is \"t\". The last letter of \"Benny\" is \"y\". The last letter of \"El\" is \"l\". So, if we concatenate these letters, we get \"ntyL\".",
24 | "pred_ans": "ntyL",
25 | "gold_ans": "ntyl"
26 | },
27 | {
28 | "question": "Q: Take the last letters of each words in \"Elizabeth Mitch Brooke Jordyn\" and concatenate them.\nA:",
29 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Elizabeth\" is \"h\". The last letter of \"Mitch\" is \"h\". The last letter of \"Brooke\" is \"e\". The last letter of \"Jordyn\" is \"n\". So, if we concatenate these letters, we get \"hen\".",
30 | "pred_ans": "hen",
31 | "gold_ans": "hhen"
32 | },
33 | {
34 | "question": "Q: Take the last letters of each words in \"Mel Josh Alejandra Harley\" and concatenate them.\nA:",
35 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Mel\" is \"l\". The last letter of \"Josh\" is \"h\". The last letter of \"Alejandra\" is \"a\". The last letter of \"Harley\" is \"y\". So if we concatenate these letters, we get \"lhay\".",
36 | "pred_ans": "lhay",
37 | "gold_ans": "lhay"
38 | },
39 | {
40 | "question": "Q: Take the last letters of each words in \"Celso Tracy Winston Anton\" and concatenate them.\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Celso\" is \"o\". The last letter of \"Tracy\" is \"y\". The last letter of \"Winston\" is \"n\". The last letter of \"Anton\" is \"n\". So, if we concatenate these letters, we get \"oynn\".",
42 | "pred_ans": "oynn",
43 | "gold_ans": "oynn"
44 | },
45 | {
46 | "question": "Q: Take the last letters of each words in \"Sabrina Pete Mary La\" and concatenate them.\nA:",
47 | "rationale": "Let's think step by step. Sure, let's break it down. The given words are: Sabrina, Pete, Mary, La. We need to take the last letter of each word and concatenate them. So, the last letters are: a (from Sabrina), e (from Pete), y (from Mary), a (from La). Now, we can concatenate them to get the final answer: aeya.",
48 | "pred_ans": "aeya",
49 | "gold_ans": "aeya"
50 | },
51 | {
52 | "question": "Q: Take the last letters of each words in \"Malcolm Hussein Franco Hugo\" and concatenate them.\nA:",
53 | "rationale": "Let's think step by step. Sure, let's break it down. The words are: Malcolm, Hussein, Franco, Hugo. We need to take the last letter of each word and concatenate them. So, the last letters are: m, n, o, o. And when we concatenate them, we get: mnoo.",
54 | "pred_ans": "mnoo",
55 | "gold_ans": "mnoo"
56 | }
57 | ],
58 | "inertia": 135.64727783203125
59 | }
--------------------------------------------------------------------------------
/demos/last_letters_gpt-3.5-turbo-0301_8:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Take the last letters of each words in \"Marco Antonio Suzette Roland Isabel\" and concatenate them.\nA:",
5 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Marco\" is \"o\". The last letter of \"Antonio\" is \"o\". The last letter of \"Suzette\" is \"e\". The last letter of \"Roland\" is \"d\". The last letter of \"Isabel\" is \"l\". So if we concatenate these letters, we get \"oodel\".",
6 | "pred_ans": "oodel",
7 | "gold_ans": "oedl"
8 | },
9 | {
10 | "question": "Q: Take the last letters of each words in \"Elizabeth Mitch Brooke Jordyn\" and concatenate them.\nA:",
11 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Elizabeth\" is \"h\". The last letter of \"Mitch\" is \"h\". The last letter of \"Brooke\" is \"e\". The last letter of \"Jordyn\" is \"n\". So, if we concatenate these letters, we get \"hen\".",
12 | "pred_ans": "hen",
13 | "gold_ans": "hhen"
14 | },
15 | {
16 | "question": "Q: Take the last letters of each words in \"Martin Sage Tanisha Rick\" and concatenate them.\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Martin\" is \"n\". The last letter of \"Sage\" is \"e\". The last letter of \"Tanisha\" is \"a\". The last letter of \"Rick\" is \"k\". So, if we concatenate these letters, we get \"neak\".",
18 | "pred_ans": "neak",
19 | "gold_ans": "neak"
20 | },
21 | {
22 | "question": "Q: Take the last letters of each words in \"Celso Tracy Winston Anton\" and concatenate them.\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Celso\" is \"o\". The last letter of \"Tracy\" is \"y\". The last letter of \"Winston\" is \"n\". The last letter of \"Anton\" is \"n\". So, if we concatenate these letters, we get \"oynn\".",
24 | "pred_ans": "oynn",
25 | "gold_ans": "oynn"
26 | },
27 | {
28 | "question": "Q: Take the last letters of each words in \"Ivy Romeo Jana Ej\" and concatenate them.\nA:",
29 | "rationale": "Let's think step by step. Sure, let's break it down. The given words are: Ivy, Romeo, Jana, Ej. We need to take the last letter of each word and concatenate them. So, the last letters are: y, o, a, j. Now, we can concatenate them to get the final answer: \"yoaj\".",
30 | "pred_ans": "yoaj",
31 | "gold_ans": "yoaj"
32 | },
33 | {
34 | "question": "Q: Take the last letters of each words in \"Virginia Juanita Zak Wayne\" and concatenate them.\nA:",
35 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Virginia\" is \"a\". The last letter of \"Juanita\" is \"a\". The last letter of \"Zak\" is \"k\". The last letter of \"Wayne\" is \"e\". So, if we concatenate these letters, we get \"ake\".",
36 | "pred_ans": "ake",
37 | "gold_ans": "aake"
38 | },
39 | {
40 | "question": "Q: Take the last letters of each words in \"Mel Josh Alejandra Harley\" and concatenate them.\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Mel\" is \"l\". The last letter of \"Josh\" is \"h\". The last letter of \"Alejandra\" is \"a\". The last letter of \"Harley\" is \"y\". So if we concatenate these letters, we get \"lhay\".",
42 | "pred_ans": "lhay",
43 | "gold_ans": "lhay"
44 | }
45 | ],
46 | "inertia": 144.42977905273438
47 | }
--------------------------------------------------------------------------------
/demos/last_letters_gpt-3.5-turbo-0301_9:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Take the last letters of each words in \"Mel Josh Alejandra Harley\" and concatenate them.\nA:",
5 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Mel\" is \"l\". The last letter of \"Josh\" is \"h\". The last letter of \"Alejandra\" is \"a\". The last letter of \"Harley\" is \"y\". So if we concatenate these letters, we get \"lhay\".",
6 | "pred_ans": "lhay",
7 | "gold_ans": "lhay"
8 | },
9 | {
10 | "question": "Q: Take the last letters of each words in \"Issa Kendra Ignacio Henry\" and concatenate them.\nA:",
11 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Issa\" is \"a\". The last letter of \"Kendra\" is \"a\". The last letter of \"Ignacio\" is \"o\". The last letter of \"Henry\" is \"y\". So, if we concatenate these letters, we get \"aao y\".",
12 | "pred_ans": "aaoy",
13 | "gold_ans": "aaoy"
14 | },
15 | {
16 | "question": "Q: Take the last letters of each words in \"Elle Alex Irma Stephan\" and concatenate them.\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Elle\" is \"e\". The last letter of \"Alex\" is \"x\". The last letter of \"Irma\" is \"a\". The last letter of \"Stephan\" is \"n\". So, if we concatenate these letters, we get \"exan\".",
18 | "pred_ans": "exan",
19 | "gold_ans": "exan"
20 | },
21 | {
22 | "question": "Q: Take the last letters of each words in \"Ivy Romeo Jana Ej\" and concatenate them.\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down. The given words are: Ivy, Romeo, Jana, Ej. We need to take the last letter of each word and concatenate them. So, the last letters are: y, o, a, j. Now, we can concatenate them to get the final answer: \"yoaj\".",
24 | "pred_ans": "yoaj",
25 | "gold_ans": "yoaj"
26 | },
27 | {
28 | "question": "Q: Take the last letters of each words in \"Celso Tracy Winston Anton\" and concatenate them.\nA:",
29 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Celso\" is \"o\". The last letter of \"Tracy\" is \"y\". The last letter of \"Winston\" is \"n\". The last letter of \"Anton\" is \"n\". So, if we concatenate these letters, we get \"oynn\".",
30 | "pred_ans": "oynn",
31 | "gold_ans": "oynn"
32 | },
33 | {
34 | "question": "Q: Take the last letters of each words in \"Sabrina Pete Mary La\" and concatenate them.\nA:",
35 | "rationale": "Let's think step by step. Sure, let's break it down. The given words are: Sabrina, Pete, Mary, La. We need to take the last letter of each word and concatenate them. So, the last letters are: a (from Sabrina), e (from Pete), y (from Mary), a (from La). Now, we can concatenate them to get the final answer: aeya.",
36 | "pred_ans": "aeya",
37 | "gold_ans": "aeya"
38 | },
39 | {
40 | "question": "Q: Take the last letters of each words in \"Virginia Juanita Zak Wayne\" and concatenate them.\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Virginia\" is \"a\". The last letter of \"Juanita\" is \"a\". The last letter of \"Zak\" is \"k\". The last letter of \"Wayne\" is \"e\". So, if we concatenate these letters, we get \"ake\".",
42 | "pred_ans": "ake",
43 | "gold_ans": "aake"
44 | },
45 | {
46 | "question": "Q: Take the last letters of each words in \"Malcolm Hussein Franco Hugo\" and concatenate them.\nA:",
47 | "rationale": "Let's think step by step. Sure, let's break it down. The words are: Malcolm, Hussein, Franco, Hugo. We need to take the last letter of each word and concatenate them. So, the last letters are: m, n, o, o. And when we concatenate them, we get: mnoo.",
48 | "pred_ans": "mnoo",
49 | "gold_ans": "mnoo"
50 | },
51 | {
52 | "question": "Q: Take the last letters of each words in \"Kristen Herbert Benny El\" and concatenate them.\nA:",
53 | "rationale": "Let's think step by step. Sure, let's break it down. The last letter of \"Kristen\" is \"n\". The last letter of \"Herbert\" is \"t\". The last letter of \"Benny\" is \"y\". The last letter of \"El\" is \"l\". So, if we concatenate these letters, we get \"ntyL\".",
54 | "pred_ans": "ntyL",
55 | "gold_ans": "ntyl"
56 | }
57 | ],
58 | "inertia": 143.28952026367188
59 | }
--------------------------------------------------------------------------------
/demos/last_letters_manual:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Take the last letters of each words in \"Whitney Erika Tj Benito\" and concatenate them.\nA:",
5 | "rationale": "The last letter of \"Whitney\" is \"y\". The last letter of \"Erika\" is \"a\". The last letter of \"Tj\" is \"j\". The last letter of \"Benito\" is \"o\".Concatenating them is \"yajo\". The answer is yajo.",
6 | "pred_ans": "yajo"
7 | },
8 | {
9 | "question": "Q: Take the last letters of each words in \"Lucky Mireya Jj Kc\" and concatenate them.\nA:",
10 | "rationale": "The last letter of \"Lucky\" is \"y\". The last letter of \"Mireya\" is \"a\". The last letter of \"Jj\" is \"j\". The last letter of \"Kc\" is \"c\".Concatenating them is \"yajc\". The answer is yajc.",
11 | "pred_ans": "yajc"
12 | },
13 | {
14 | "question": "Q: Take the last letters of each words in \"Caleb Chase Eleazar Chanel\" and concatenate them.\nA:",
15 | "rationale": "The last letter of \"Caleb\" is \"b\". The last letter of \"Chase\" is \"e\". The last letter of \"Eleazar\" is \"r\". The last letter of \"Chanel\" is \"l\".Concatenating them is \"berl\". The answer is berl.",
16 | "pred_ans": "berl"
17 | },
18 | {
19 | "question": "Q: Take the last letters of each words in \"Silvia Carolina Stan Chuck\" and concatenate them.\nA:",
20 | "rationale": "The last letter of \"Silvia\" is \"a\". The last letter of \"Carolina\" is \"a\". The last letter of \"Stan\" is \"n\". The last letter of \"Chuck\" is \"k\".Concatenating them is \"aank\". The answer is aank.",
21 | "pred_ans": "aank"
22 | }
23 | ]
24 | }
--------------------------------------------------------------------------------
/demos/multiarith:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: There were 8 friends playing a video game online when 2 more players joined the game. If each player had 6 lives, how many lives did they have total?\nA:",
5 | "rationale": "Let's think step by step. There were 8 friends playing a game. So, they had 8*6=48 lives in total. Then, 2 more players joined the game. So, the total number of lives became 8*6+2*6=60.",
6 | "pred_ans": "60",
7 | "gold_ans": "60"
8 | },
9 | {
10 | "question": "Q: The school cafeteria ordered 8 red apples and 43 green apples for students lunches. But, if only 42 students wanted fruit, how many extra did the cafeteria end up with?\nA:",
11 | "rationale": "Let's think step by step. The school cafeteria ordered 8 red apples and 43 green apples for students lunches. This means that they ordered a total of 51 apples. But, if only 42 students wanted fruit, This means that the school cafeteria would have 9 apples leftover.",
12 | "pred_ans": "9",
13 | "gold_ans": "9"
14 | },
15 | {
16 | "question": "Q: Bianca was organizing her book case making sure each of the shelves had exactly 8 books on it. If she had 5 shelves of mystery books and 4 shelves of picture books, how many books did she have total?\nA:",
17 | "rationale": "Let's think step by step. There are 5 shelves of mystery books. Each shelf has 8 books. So that's 40 mystery books. There are 4 shelves of picture books. Each shelf has 8 books. So that's 32 picture books. 40 + 32 = 72 books.",
18 | "pred_ans": "72",
19 | "gold_ans": "72"
20 | },
21 | {
22 | "question": "Q: Mike made 69 dollars mowing lawns over the summer. If he spent 24 dollars buying new mower blades, how many 5 dollar games could he buy with the money he had left?\nA:",
23 | "rationale": "Let's think step by step. Mike made $69 from mowing lawns. He spent $24 on new mower blades. That means he has $45 left. Each game costs $5, so he could buy 9 games.",
24 | "pred_ans": "9",
25 | "gold_ans": "9"
26 | },
27 | {
28 | "question": "Q: A pet store had 78 puppies. In one day they sold 30 of them and put the rest into cages with 8 in each cage. How many cages did they use?\nA:",
29 | "rationale": "Let's think step by step. There are 78 puppies. 30 are sold, so that means there are 48 left. 48 divided by 8 is 6, so that means there are 6 cages with 8 puppies in each.",
30 | "pred_ans": "6",
31 | "gold_ans": "6"
32 | },
33 | {
34 | "question": "Q: Wendy uploaded 45 pictures to Facebook. She put 27 pics into one album and put the rest into 9 different albums. How many pictures were in each album?\nA:",
35 | "rationale": "Let's think step by step. First, we know that Wendy uploaded 45 pictures in total. Second, we know that Wendy put 27 pictures into one album. That means that Wendy put the remaining 18 pictures into 9 different albums. That means that each album would have 2 pictures.",
36 | "pred_ans": "2",
37 | "gold_ans": "2"
38 | },
39 | {
40 | "question": "Q: For Halloween Katie and her sister combined the candy they received. Katie had 8 pieces of candy while her sister had 23. If they ate 8 pieces the first night, how many pieces do they have left?\nA:",
41 | "rationale": "Let's think step by step. Katie and her sister have a total of 8 + 23 = 31 pieces of candy. If they eat 8 pieces the first night, they have 31 - 8 = 23 pieces left.",
42 | "pred_ans": "23",
43 | "gold_ans": "23"
44 | },
45 | {
46 | "question": "Q: For the school bake sale Maria made 19 cupcakes. If she sold 5 of them and then made 10 more, how many cupcakes would she have?\nA:",
47 | "rationale": "Let's think step by step. First, Maria made 19 cupcakes. Then, she sold 5 of them. So now she has 14 cupcakes. Then, she made 10 more. So now she has 24 cupcakes.",
48 | "pred_ans": "24",
49 | "gold_ans": "24"
50 | }
51 | ]
52 | }
--------------------------------------------------------------------------------
/demos/multiarith_auto:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Wendy uploaded 45 pictures to Facebook. She put 27 pics into one album and put the rest into 9 different albums. How many pictures were in each album?\nA:",
5 | "rationale": "Let's think step by step. First, we know that Wendy uploaded 45 pictures in total. Second, we know that Wendy put 27 pictures into one album. That means that Wendy put the remaining 18 pictures into 9 different albums. That means that each album would have 2 pictures.",
6 | "pred_ans": "2",
7 | "gold_ans": "2"
8 | },
9 | {
10 | "question": "Q: For Halloween Katie and her sister combined the candy they received. Katie had 8 pieces of candy while her sister had 23. If they ate 8 pieces the first night, how many pieces do they have left?\nA:",
11 | "rationale": "Let's think step by step. Katie and her sister have a total of 8 + 23 = 31 pieces of candy. If they eat 8 pieces the first night, they have 31 - 8 = 23 pieces left.",
12 | "pred_ans": "23",
13 | "gold_ans": "23"
14 | },
15 | {
16 | "question": "Q: Bianca was organizing her book case making sure each of the shelves had exactly 8 books on it. If she had 5 shelves of mystery books and 4 shelves of picture books, how many books did she have total?\nA:",
17 | "rationale": "Let's think step by step. There are 5 shelves of mystery books. Each shelf has 8 books. So that's 40 mystery books. There are 4 shelves of picture books. Each shelf has 8 books. So that's 32 picture books. 40 + 32 = 72 books.",
18 | "pred_ans": "72",
19 | "gold_ans": "72"
20 | },
21 | {
22 | "question": "Q: A pet store had 78 puppies. In one day they sold 30 of them and put the rest into cages with 8 in each cage. How many cages did they use?\nA:",
23 | "rationale": "Let's think step by step. There are 78 puppies. 30 are sold, so that means there are 48 left. 48 divided by 8 is 6, so that means there are 6 cages with 8 puppies in each.",
24 | "pred_ans": "6",
25 | "gold_ans": "6"
26 | },
27 | {
28 | "question": "Q: A waiter had 14 customers to wait on. If 3 customers left and he got another 39 customers, how many customers would he have?\nA:",
29 | "rationale": "Let's think step by step. The waiter had 14 customers to wait on. If 3 customers left, that means he would have 11 customers left. If he got another 39 customers, that means he would have 50 customers in total.",
30 | "pred_ans": "50",
31 | "gold_ans": "50"
32 | },
33 | {
34 | "question": "Q: A trivia team had 7 members total, but during a game 2 members didn't show up. If each member that did show up scored 4 points, how many points were scored total?\nA:",
35 | "rationale": "Let's think step by step. There were 7 members on the team, but 2 members didn't show up. That means that there were 5 members that did show up. Each member that showed up scored 4 points. So if 5 members each scored 4 points, then the total number of points scored would be 5*4=20.",
36 | "pred_ans": "20",
37 | "gold_ans": "20"
38 | },
39 | {
40 | "question": "Q: Gwen had 18 math problems and 11 science problems for homework. If she finished 24 of the problems at school, how many problems did she have to do for homework?\nA:",
41 | "rationale": "Let's think step by step. Gwen had 18 math problems and 11 science problems for homework. That means she had a total of 29 problems for homework. If she finished 24 of the problems at school, that means she had 5 problems left to do for homework.",
42 | "pred_ans": "5",
43 | "gold_ans": "5"
44 | },
45 | {
46 | "question": "Q: Mike made 69 dollars mowing lawns over the summer. If he spent 24 dollars buying new mower blades, how many 5 dollar games could he buy with the money he had left?\nA:",
47 | "rationale": "Let's think step by step. Mike made $69 from mowing lawns. He spent $24 on new mower blades. That means he has $45 left. Each game costs $5, so he could buy 9 games.",
48 | "pred_ans": "9",
49 | "gold_ans": "9"
50 | }
51 | ]
52 | }
--------------------------------------------------------------------------------
/demos/multiarith_gpt-3.5-turbo-0301:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: The school cafeteria ordered 25 red apples and 17 green apples for students lunches. But, if only 10 students wanted fruit, how many extra did the cafeteria end up with?\nA:",
5 | "rationale": "Let's think step by step. First, we need to find the total number of apples ordered by the cafeteria, which is 25 + 17 = 42 apples. Next, we need to find out how many apples each student would get if only 10 students wanted fruit. To do this, we divide the total number of apples by the number of students: 42 ÷ 10 = 4.2 apples per student. Since we can't have a fraction of an apple, we need to round down to the nearest whole number. Each student would get 4 apples. So, if only 10 students wanted fruit, they would need a total of 10 x 4 = 40 apples. Therefore, the cafeteria would end up with 42 - 40 = 2 extra apples.",
6 | "pred_ans": "2",
7 | "gold_ans": "32"
8 | },
9 | {
10 | "question": "Q: For the school bake sale Chloe made 28 cupcakes. If she sold 25 of them and then made 8 more, how many cupcakes would she have?\nA:",
11 | "rationale": "Let's think step by step. First, Chloe made 28 cupcakes. Then, she sold 25 of them. So, she would have 28 - 25 = 3 cupcakes left. After that, she made 8 more cupcakes. So, she would have 3 + 8 = 11 cupcakes in total.",
12 | "pred_ans": "11",
13 | "gold_ans": "11"
14 | },
15 | {
16 | "question": "Q: There were 7 friends playing a video game online when 2 more players joined the game. If each player had 7 lives, how many lives did they have total?\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. First, we know that there were 7 friends playing the game. So, they had a total of 7 x 7 = 49 lives. Next, 2 more players joined the game. So, we need to add their lives to the total. Each player has 7 lives, so 2 players would have 2 x 7 = 14 lives. Therefore, the total number of lives in the game would be 49 + 14 = 63 lives.",
18 | "pred_ans": "63",
19 | "gold_ans": "63"
20 | },
21 | {
22 | "question": "Q: A pet store has 8 bird cages. If each cage has 2 parrots and 7 parakeets in it, how many birds does the pet store have total?\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down step by step. First, we need to find out how many birds are in each cage. We know that each cage has 2 parrots and 7 parakeets, so that's a total of 9 birds per cage. Next, we need to find out how many birds are in all of the cages combined. To do this, we can multiply the number of cages by the number of birds per cage: 8 cages x 9 birds per cage = 72 birds So the pet store has a total of 72 birds.",
24 | "pred_ans": "72",
25 | "gold_ans": "72"
26 | },
27 | {
28 | "question": "Q: Megan was organizing her book case making sure each of the shelves had exactly 7 books on it. If she had 8 shelves of mystery books and 2 shelves of picture books, how many books did she have total?\nA:",
29 | "rationale": "Let's think step by step. Sure, let's break it down step by step. First, we need to find out how many books Megan has on each shelf. She has 8 shelves of mystery books, and each shelf has 7 books, so she has 8 x 7 = 56 mystery books. Next, we need to find out how many books she has on the picture book shelves. She has 2 shelves of picture books, and each shelf has 7 books, so she has 2 x 7 = 14 picture books. Finally, we can add the number of mystery books and picture books together to find the total number of books Megan has. 56 + 14 = 70 books in total. Therefore, Megan has a total of 70 books.",
30 | "pred_ans": "70",
31 | "gold_ans": "70"
32 | },
33 | {
34 | "question": "Q: At lunch a waiter had 7 customers and 4 of them didn't leave a tip. If he got $9 each from the ones who did tip, how much money did he earn?\nA:",
35 | "rationale": "Let's think step by step. Sure, let's break down the problem. The waiter had 7 customers in total. Out of these 7 customers, 4 didn't leave a tip. So, the number of customers who left a tip is 7 - 4 = 3. The waiter got $9 each from the customers who left a tip. So, the total amount of money he earned from these customers is 3 x $9 = $27. Therefore, the waiter earned $27 in total.",
36 | "pred_ans": "27",
37 | "gold_ans": "27"
38 | },
39 | {
40 | "question": "Q: Mike made 69 dollars mowing lawns over the summer. If he spent 24 dollars buying new mower blades, how many 5 dollar games could he buy with the money he had left?\nA:",
41 | "rationale": "Let's think step by step. First, we need to find out how much money Mike has left after buying the new mower blades. We can do this by subtracting the cost of the blades from the amount of money he made: 69 dollars - 24 dollars = 45 dollars Now we know that Mike has 45 dollars left to spend on games. To find out how many 5 dollar games he can buy, we can divide the amount of money he has left by the cost of each game: 45 dollars ÷ 5 dollars/game = 9 games Therefore, Mike can buy 9 5-dollar games with the money he has left after buying the new mower blades.",
42 | "pred_ans": "9",
43 | "gold_ans": "9"
44 | },
45 | {
46 | "question": "Q: Wendy uploaded 45 pictures to Facebook. She put 27 pics into one album and put the rest into 9 different albums. How many pictures were in each album?\nA:",
47 | "rationale": "Let's think step by step. First, we know that Wendy put 27 pictures into one album. So, we subtract 27 from the total number of pictures to find out how many pictures were left to be distributed among the 9 albums. 45 - 27 = 18 Now we need to divide the remaining 18 pictures equally among the 9 albums. 18 ÷ 9 = 2 Therefore, there were 2 pictures in each of the 9 albums.",
48 | "pred_ans": "2",
49 | "gold_ans": "2"
50 | }
51 | ]
52 | }
--------------------------------------------------------------------------------
/demos/multiarith_gpt-3.5-turbo-0301_8:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: The school cafeteria ordered 25 red apples and 17 green apples for students lunches. But, if only 10 students wanted fruit, how many extra did the cafeteria end up with?\nA:",
5 | "rationale": "Let's think step by step. First, we need to find the total number of apples ordered by the cafeteria, which is 25 + 17 = 42 apples. Next, we need to find out how many apples each student would get if only 10 students wanted fruit. To do this, we divide the total number of apples by the number of students: 42 ÷ 10 = 4.2 apples per student. Since we can't have a fraction of an apple, we need to round down to the nearest whole number. Each student would get 4 apples. So, if only 10 students wanted fruit, they would need a total of 10 x 4 = 40 apples. Therefore, the cafeteria would end up with 42 - 40 = 2 extra apples.",
6 | "pred_ans": "2",
7 | "gold_ans": "32"
8 | },
9 | {
10 | "question": "Q: For the school bake sale Chloe made 28 cupcakes. If she sold 25 of them and then made 8 more, how many cupcakes would she have?\nA:",
11 | "rationale": "Let's think step by step. First, Chloe made 28 cupcakes. Then, she sold 25 of them. So, she would have 28 - 25 = 3 cupcakes left. After that, she made 8 more cupcakes. So, she would have 3 + 8 = 11 cupcakes in total.",
12 | "pred_ans": "11",
13 | "gold_ans": "11"
14 | },
15 | {
16 | "question": "Q: There were 7 friends playing a video game online when 2 more players joined the game. If each player had 7 lives, how many lives did they have total?\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. First, we know that there were 7 friends playing the game. So, they had a total of 7 x 7 = 49 lives. Next, 2 more players joined the game. So, we need to add their lives to the total. Each player has 7 lives, so 2 players would have 2 x 7 = 14 lives. Therefore, the total number of lives in the game would be 49 + 14 = 63 lives.",
18 | "pred_ans": "63",
19 | "gold_ans": "63"
20 | },
21 | {
22 | "question": "Q: A pet store has 8 bird cages. If each cage has 2 parrots and 7 parakeets in it, how many birds does the pet store have total?\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down step by step. First, we need to find out how many birds are in each cage. We know that each cage has 2 parrots and 7 parakeets, so that's a total of 9 birds per cage. Next, we need to find out how many birds are in all of the cages combined. To do this, we can multiply the number of cages by the number of birds per cage: 8 cages x 9 birds per cage = 72 birds So the pet store has a total of 72 birds.",
24 | "pred_ans": "72",
25 | "gold_ans": "72"
26 | },
27 | {
28 | "question": "Q: Megan was organizing her book case making sure each of the shelves had exactly 7 books on it. If she had 8 shelves of mystery books and 2 shelves of picture books, how many books did she have total?\nA:",
29 | "rationale": "Let's think step by step. Sure, let's break it down step by step. First, we need to find out how many books Megan has on each shelf. She has 8 shelves of mystery books, and each shelf has 7 books, so she has 8 x 7 = 56 mystery books. Next, we need to find out how many books she has on the picture book shelves. She has 2 shelves of picture books, and each shelf has 7 books, so she has 2 x 7 = 14 picture books. Finally, we can add the number of mystery books and picture books together to find the total number of books Megan has. 56 + 14 = 70 books in total. Therefore, Megan has a total of 70 books.",
30 | "pred_ans": "70",
31 | "gold_ans": "70"
32 | },
33 | {
34 | "question": "Q: At lunch a waiter had 7 customers and 4 of them didn't leave a tip. If he got $9 each from the ones who did tip, how much money did he earn?\nA:",
35 | "rationale": "Let's think step by step. Sure, let's break down the problem. The waiter had 7 customers in total. Out of these 7 customers, 4 didn't leave a tip. So, the number of customers who left a tip is 7 - 4 = 3. The waiter got $9 each from the customers who left a tip. So, the total amount of money he earned from these customers is 3 x $9 = $27. Therefore, the waiter earned $27 in total.",
36 | "pred_ans": "27",
37 | "gold_ans": "27"
38 | },
39 | {
40 | "question": "Q: Mike made 69 dollars mowing lawns over the summer. If he spent 24 dollars buying new mower blades, how many 5 dollar games could he buy with the money he had left?\nA:",
41 | "rationale": "Let's think step by step. First, we need to find out how much money Mike has left after buying the new mower blades. We can do this by subtracting the cost of the blades from the amount of money he made: 69 dollars - 24 dollars = 45 dollars Now we know that Mike has 45 dollars left to spend on games. To find out how many 5 dollar games he can buy, we can divide the amount of money he has left by the cost of each game: 45 dollars ÷ 5 dollars/game = 9 games Therefore, Mike can buy 9 5-dollar games with the money he has left after buying the new mower blades.",
42 | "pred_ans": "9",
43 | "gold_ans": "9"
44 | },
45 | {
46 | "question": "Q: Wendy uploaded 45 pictures to Facebook. She put 27 pics into one album and put the rest into 9 different albums. How many pictures were in each album?\nA:",
47 | "rationale": "Let's think step by step. First, we know that Wendy put 27 pictures into one album. So, we subtract 27 from the total number of pictures to find out how many pictures were left to be distributed among the 9 albums. 45 - 27 = 18 Now we need to divide the remaining 18 pictures equally among the 9 albums. 18 ÷ 9 = 2 Therefore, there were 2 pictures in each of the 9 albums.",
48 | "pred_ans": "2",
49 | "gold_ans": "2"
50 | }
51 | ],
52 | "inertia": 234.3535614013672
53 | }
--------------------------------------------------------------------------------
/demos/multiarith_manual:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: There are 15 trees in the grove. Grove workers will plant trees in the grove today. After they are done, there will be 21 trees. How many trees did the grove workers plant today?\nA:",
5 | "rationale": "There are 15 trees originally. Then there were 21 trees after some more were planted. So there must have been 21 - 15 = 6.",
6 | "pred_ans": "6"
7 | },
8 | {
9 | "question": "Q: If there are 3 cars in the parking lot and 2 more cars arrive, how many cars are in the parking lot?\nA:",
10 | "rationale": "There are originally 3 cars. 2 more cars arrive. 3 + 2 = 5.",
11 | "pred_ans": "5"
12 | },
13 | {
14 | "question": "Q: Leah had 32 chocolates and her sister had 42. If they ate 35, how many pieces do they have left in total?\nA:",
15 | "rationale": "Originally, Leah had 32 chocolates. Her sister had 42. So in total they had 32 + 42 = 74. After eating 35, they had 74 - 35 = 39.",
16 | "pred_ans": "39"
17 | },
18 | {
19 | "question": "Q: Jason had 20 lollipops. He gave Denny some lollipops. Now Jason has 12 lollipops. How many lollipops did Jason give to Denny?\nA:",
20 | "rationale": "Jason started with 20 lollipops. Then he had 12 after giving some to Denny. So he gave Denny 20 - 12 = 8.",
21 | "pred_ans": "8"
22 | },
23 | {
24 | "question": "Q: Shawn has five toys. For Christmas, he got two toys each from his mom and dad. How many toys does he have now?\nA:",
25 | "rationale": "Shawn started with 5 toys. If he got 2 toys each from his mom and dad, then that is 4 more toys. 5 + 4 = 9.",
26 | "pred_ans": "9"
27 | },
28 | {
29 | "question": "Q: There were nine computers in the server room. Five more computers were installed each day, from monday to thursday. How many computers are now in the server room?\nA:",
30 | "rationale": "There were originally 9 computers. For each of 4 days, 5 more computers were added. So 5 * 4 = 20 computers were added. 9 + 20 is 29.",
31 | "pred_ans": "29"
32 | },
33 | {
34 | "question": "Q: Michael had 58 golf balls. On tuesday, he lost 23 golf balls. On wednesday, he lost 2 more. How many golf balls did he have at the end of wednesday?\nA:",
35 | "rationale": "Michael started with 58 golf balls. After losing 23 on tuesday, he had 58 - 23 = 35. After losing 2 more, he had 35 - 2 = 33 golf balls.",
36 | "pred_ans": "33"
37 | },
38 | {
39 | "question": "Q: Olivia has $23. She bought five bagels for $3 each. How much money does she have left?\nA:",
40 | "rationale": "Olivia had 23 dollars. 5 bagels for 3 dollars each will be 5 x 3 = 15 dollars. So she has 23 - 15 dollars left. 23 - 15 is 8.",
41 | "pred_ans": "8"
42 | }
43 | ]
44 | }
--------------------------------------------------------------------------------
/demos/singleeq_gpt-3.5-turbo-0301:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Nancy has 9 five dollars bills. How much money does she have ?\nA:",
5 | "rationale": "Let's think step by step. Sure, let's break it down. Nancy has 9 five dollar bills. So, we can start by multiplying 9 by 5 to find out how much money she has in total. 9 x 5 = 45 Therefore, Nancy has $45 in total.",
6 | "pred_ans": "45",
7 | "gold_ans": "45"
8 | },
9 | {
10 | "question": "Q: Nancy has 7 black balloons. Mary has 4 times more black balloons than Nancy. How many black balloons does Mary have now ?\nA:",
11 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to find out how many black balloons Mary has. We know that Mary has 4 times more black balloons than Nancy, so we can start by multiplying Nancy's number of black balloons by 4. 4 x 7 = 28 So Mary has 28 black balloons. Therefore, Mary has 28 black balloons now.",
12 | "pred_ans": "28",
13 | "gold_ans": "28"
14 | },
15 | {
16 | "question": "Q: Sally picked 7 lemons and Mary picked 9 lemons from the lemon tree. How many lemons were picked in total ?\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. First, we need to add the number of lemons Sally picked (7) to the number of lemons Mary picked (9). 7 + 9 = 16 So, in total, 16 lemons were picked.",
18 | "pred_ans": "16",
19 | "gold_ans": "16"
20 | },
21 | {
22 | "question": "Q: A teacher has 344 pieces of candy. If there are 43 students, and the candy is divided evenly, How many pieces will each student get?\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down. First, we need to divide the total number of candy pieces (344) by the number of students (43) to find out how many pieces each student will get. So, 344 ÷ 43 = 8 Therefore, each student will get 8 pieces of candy.",
24 | "pred_ans": "8",
25 | "gold_ans": "8"
26 | },
27 | {
28 | "question": "Q: Joan has 10 books. Tom has 38 books. How many books do they have together ?\nA:",
29 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the number of books Joan and Tom have. Joan has 10 books and Tom has 38 books, so: 10 + 38 = 48 Therefore, Joan and Tom have 48 books together.",
30 | "pred_ans": "48",
31 | "gold_ans": "48"
32 | },
33 | {
34 | "question": "Q: Kelly bought 0.1 pounds of peanuts and 0.4 pounds of raisins. How many pounds of snacks did she buy in all?\nA:",
35 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the weight of peanuts and raisins to find the total weight of snacks. 0.1 pounds (peanuts) + 0.4 pounds (raisins) = 0.5 pounds Therefore, Kelly bought 0.5 pounds of snacks in all.",
36 | "pred_ans": "0.5",
37 | "gold_ans": "0.5"
38 | },
39 | {
40 | "question": "Q: Alyssa's high school played 31 hockey games this year. She attended 13 games. How many hockey games did Alyssa miss ?\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down. We know that Alyssa attended 13 hockey games out of 31 total games played by her high school team. To find out how many games she missed, we can subtract the number of games she attended from the total number of games played: 31 - 13 = 18 Therefore, Alyssa missed 18 hockey games.",
42 | "pred_ans": "18",
43 | "gold_ans": "18"
44 | },
45 | {
46 | "question": "Q: Stanley ran 0.4 of a mile and walked 0.2 of a mile. How much farther did Stanley run than walk?\nA:",
47 | "rationale": "Let's think step by step. Sure, let's break it down step by step. First, we need to find the difference between the distance Stanley ran and walked. To do this, we can subtract the distance he walked from the distance he ran: 0.4 - 0.2 = 0.2 So Stanley ran 0.2 miles farther than he walked.",
48 | "pred_ans": "0.2",
49 | "gold_ans": "0.2"
50 | }
51 | ]
52 | }
--------------------------------------------------------------------------------
/demos/singleeq_gpt-3.5-turbo-0301_10:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Tom found 5 seashells on the beach. he gave Jessica 2 of the seashells. How many seashells does he now have ?\nA:",
5 | "rationale": "Let's think step by step. Tom had 5 seashells initially. He gave 2 seashells to Jessica. So, the number of seashells Tom has now is: 5 - 2 = 3 Therefore, Tom now has 3 seashells.",
6 | "pred_ans": "3",
7 | "gold_ans": "3"
8 | },
9 | {
10 | "question": "Q: Alyssa has 36 books. Nancy has 7 times more books than Alyssa. How many books does Nancy have ?\nA:",
11 | "rationale": "Let's think step by step. Sure, let's break it down. First, we need to find out how many books Nancy has compared to Alyssa. To do this, we can multiply Alyssa's number of books by 7: 36 x 7 = 252 So Nancy has 252 books.",
12 | "pred_ans": "252",
13 | "gold_ans": "252"
14 | },
15 | {
16 | "question": "Q: Ellen went to a garage sale to buy chairs. Each chair is 15 dollars. How much did Ellen spend for the 12 chairs she bought?\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. Ellen bought 12 chairs and each chair costs $15. So, we can multiply the number of chairs by the cost of each chair: 12 x $15 = $180 Therefore, Ellen spent $180 for the 12 chairs she bought.",
18 | "pred_ans": "180",
19 | "gold_ans": "180"
20 | },
21 | {
22 | "question": "Q: Stanley ran 0.4 of a mile and walked 0.2 of a mile. How much farther did Stanley run than walk?\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down step by step. First, we need to find the difference between the distance Stanley ran and walked. To do this, we can subtract the distance he walked from the distance he ran: 0.4 - 0.2 = 0.2 So Stanley ran 0.2 miles farther than he walked.",
24 | "pred_ans": "0.2",
25 | "gold_ans": "0.2"
26 | },
27 | {
28 | "question": "Q: There are 107 walnut trees currently in the park. Park workers will plant 104 more walnut trees today. How many walnut trees will the park have when the workers are finished ?\nA:",
29 | "rationale": "Let's think step by step. First, we need to add the number of walnut trees currently in the park (107) to the number of walnut trees the workers will plant today (104). So, 107 + 104 = 211 Therefore, the park will have 211 walnut trees when the workers are finished planting.",
30 | "pred_ans": "211",
31 | "gold_ans": "211"
32 | },
33 | {
34 | "question": "Q: Benny picked 2 apples and Dan picked 9 apples from the apple tree. How many apples were picked in total ?\nA:",
35 | "rationale": "Let's think step by step. First, we need to add the number of apples Benny picked (2) to the number of apples Dan picked (9). 2 + 9 = 11 Therefore, the total number of apples picked is 11.",
36 | "pred_ans": "11",
37 | "gold_ans": "11"
38 | },
39 | {
40 | "question": "Q: Sally bought 4 dozen eggs from the grocery store to bake some cakes. How many eggs did Sally buy ?\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down. First, we need to know how many eggs are in a dozen. A dozen is equal to 12, so 4 dozen would be: 4 x 12 = 48 Therefore, Sally bought 48 eggs from the grocery store.",
42 | "pred_ans": "48",
43 | "gold_ans": "48"
44 | },
45 | {
46 | "question": "Q: Sara had 21 quarters in her bank. Her dad gave her 49 more quarters. How many quarters does she have now ?\nA:",
47 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to find the total number of quarters Sara has after her dad gave her 49 more quarters. To do this, we can add the number of quarters she had before to the number of quarters her dad gave her. So, the total number of quarters Sara has now is: 21 + 49 = 70 Therefore, Sara has 70 quarters now.",
48 | "pred_ans": "70",
49 | "gold_ans": "70"
50 | },
51 | {
52 | "question": "Q: Kelly bought 0.1 pounds of peanuts and 0.4 pounds of raisins. How many pounds of snacks did she buy in all?\nA:",
53 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the weight of peanuts and raisins to find the total weight of snacks. 0.1 pounds (peanuts) + 0.4 pounds (raisins) = 0.5 pounds Therefore, Kelly bought 0.5 pounds of snacks in all.",
54 | "pred_ans": "0.5",
55 | "gold_ans": "0.5"
56 | },
57 | {
58 | "question": "Q: Alyssa's high school played 31 hockey games this year. She attended 13 games. How many hockey games did Alyssa miss ?\nA:",
59 | "rationale": "Let's think step by step. Sure, let's break it down. We know that Alyssa attended 13 hockey games out of 31 total games played by her high school team. To find out how many games she missed, we can subtract the number of games she attended from the total number of games played: 31 - 13 = 18 Therefore, Alyssa missed 18 hockey games.",
60 | "pred_ans": "18",
61 | "gold_ans": "18"
62 | }
63 | ],
64 | "inertia": 231.68568420410156
65 | }
--------------------------------------------------------------------------------
/demos/singleeq_gpt-3.5-turbo-0301_11:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Jason has 3 Pokemon cards. Benny bought 2 of Jason's Pokemon cards. How many Pokemon cards does Jason have now ?\nA:",
5 | "rationale": "Let's think step by step. First, we need to find out how many Pokemon cards Jason has after Benny bought 2 of them. If Jason had 3 Pokemon cards and Benny bought 2 of them, then Jason would have 1 Pokemon card left. Therefore, Jason has 1 Pokemon card now.",
6 | "pred_ans": "1",
7 | "gold_ans": "1"
8 | },
9 | {
10 | "question": "Q: Willy has 1400 crayons. Lucy has 290 crayons. How many more crayons does Willy have then Lucy?\nA:",
11 | "rationale": "Let's think step by step. Sure, let's break it down. First, we need to find the difference between the number of crayons Willy has and the number of crayons Lucy has. To do this, we can subtract the number of crayons Lucy has from the number of crayons Willy has: 1400 - 290 = 1110 So, Willy has 1110 more crayons than Lucy.",
12 | "pred_ans": "1110",
13 | "gold_ans": "1110"
14 | },
15 | {
16 | "question": "Q: Sara had 21 quarters in her bank. Her dad gave her 49 more quarters. How many quarters does she have now ?\nA:",
17 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to find the total number of quarters Sara has after her dad gave her 49 more quarters. To do this, we can add the number of quarters she had before to the number of quarters her dad gave her. So, the total number of quarters Sara has now is: 21 + 49 = 70 Therefore, Sara has 70 quarters now.",
18 | "pred_ans": "70",
19 | "gold_ans": "70"
20 | },
21 | {
22 | "question": "Q: Ellen went to a garage sale to buy chairs. Each chair is 15 dollars. How much did Ellen spend for the 12 chairs she bought?\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down. Ellen bought 12 chairs and each chair costs $15. So, we can multiply the number of chairs by the cost of each chair: 12 x $15 = $180 Therefore, Ellen spent $180 for the 12 chairs she bought.",
24 | "pred_ans": "180",
25 | "gold_ans": "180"
26 | },
27 | {
28 | "question": "Q: Stanley ran 0.4 of a mile and walked 0.2 of a mile. How much farther did Stanley run than walk?\nA:",
29 | "rationale": "Let's think step by step. Sure, let's break it down step by step. First, we need to find the difference between the distance Stanley ran and walked. To do this, we can subtract the distance he walked from the distance he ran: 0.4 - 0.2 = 0.2 So Stanley ran 0.2 miles farther than he walked.",
30 | "pred_ans": "0.2",
31 | "gold_ans": "0.2"
32 | },
33 | {
34 | "question": "Q: Tom found 5 seashells on the beach. he gave Jessica 2 of the seashells. How many seashells does he now have ?\nA:",
35 | "rationale": "Let's think step by step. Tom had 5 seashells initially. He gave 2 seashells to Jessica. So, the number of seashells Tom has now is: 5 - 2 = 3 Therefore, Tom now has 3 seashells.",
36 | "pred_ans": "3",
37 | "gold_ans": "3"
38 | },
39 | {
40 | "question": "Q: Bryan took a look at his books as well. If Bryan has 56 books in each of his 9 bookshelves, how many books does he have in total?\nA:",
41 | "rationale": "Let's think step by step. First, we can find out how many books Bryan has in one bookshelf by multiplying the number of books in each bookshelf by the number of bookshelves: 56 books/bookshelf x 9 bookshelves = 504 books So Bryan has 504 books in total.",
42 | "pred_ans": "504",
43 | "gold_ans": "504"
44 | },
45 | {
46 | "question": "Q: Benny picked 2 apples and Dan picked 9 apples from the apple tree. How many apples were picked in total ?\nA:",
47 | "rationale": "Let's think step by step. First, we need to add the number of apples Benny picked (2) to the number of apples Dan picked (9). 2 + 9 = 11 Therefore, the total number of apples picked is 11.",
48 | "pred_ans": "11",
49 | "gold_ans": "11"
50 | },
51 | {
52 | "question": "Q: Kelly bought 0.1 pounds of peanuts and 0.4 pounds of raisins. How many pounds of snacks did she buy in all?\nA:",
53 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the weight of peanuts and raisins to find the total weight of snacks. 0.1 pounds (peanuts) + 0.4 pounds (raisins) = 0.5 pounds Therefore, Kelly bought 0.5 pounds of snacks in all.",
54 | "pred_ans": "0.5",
55 | "gold_ans": "0.5"
56 | },
57 | {
58 | "question": "Q: Alyssa's high school played 31 hockey games this year. She attended 13 games. How many hockey games did Alyssa miss ?\nA:",
59 | "rationale": "Let's think step by step. Sure, let's break it down. We know that Alyssa attended 13 hockey games out of 31 total games played by her high school team. To find out how many games she missed, we can subtract the number of games she attended from the total number of games played: 31 - 13 = 18 Therefore, Alyssa missed 18 hockey games.",
60 | "pred_ans": "18",
61 | "gold_ans": "18"
62 | },
63 | {
64 | "question": "Q: There are 107 walnut trees currently in the park. Park workers will plant 104 more walnut trees today. How many walnut trees will the park have when the workers are finished ?\nA:",
65 | "rationale": "Let's think step by step. First, we need to add the number of walnut trees currently in the park (107) to the number of walnut trees the workers will plant today (104). So, 107 + 104 = 211 Therefore, the park will have 211 walnut trees when the workers are finished planting.",
66 | "pred_ans": "211",
67 | "gold_ans": "211"
68 | }
69 | ],
70 | "inertia": 226.80731201171875
71 | }
--------------------------------------------------------------------------------
/demos/singleeq_gpt-3.5-turbo-0301_8:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Nancy has 9 five dollars bills. How much money does she have ?\nA:",
5 | "rationale": "Let's think step by step. Sure, let's break it down. Nancy has 9 five dollar bills. So, we can start by multiplying 9 by 5 to find out how much money she has in total. 9 x 5 = 45 Therefore, Nancy has $45 in total.",
6 | "pred_ans": "45",
7 | "gold_ans": "45"
8 | },
9 | {
10 | "question": "Q: Nancy has 7 black balloons. Mary has 4 times more black balloons than Nancy. How many black balloons does Mary have now ?\nA:",
11 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to find out how many black balloons Mary has. We know that Mary has 4 times more black balloons than Nancy, so we can start by multiplying Nancy's number of black balloons by 4. 4 x 7 = 28 So Mary has 28 black balloons. Therefore, Mary has 28 black balloons now.",
12 | "pred_ans": "28",
13 | "gold_ans": "28"
14 | },
15 | {
16 | "question": "Q: Sally picked 7 lemons and Mary picked 9 lemons from the lemon tree. How many lemons were picked in total ?\nA:",
17 | "rationale": "Let's think step by step. Sure, let's break it down. First, we need to add the number of lemons Sally picked (7) to the number of lemons Mary picked (9). 7 + 9 = 16 So, in total, 16 lemons were picked.",
18 | "pred_ans": "16",
19 | "gold_ans": "16"
20 | },
21 | {
22 | "question": "Q: A teacher has 344 pieces of candy. If there are 43 students, and the candy is divided evenly, How many pieces will each student get?\nA:",
23 | "rationale": "Let's think step by step. Sure, let's break it down. First, we need to divide the total number of candy pieces (344) by the number of students (43) to find out how many pieces each student will get. So, 344 ÷ 43 = 8 Therefore, each student will get 8 pieces of candy.",
24 | "pred_ans": "8",
25 | "gold_ans": "8"
26 | },
27 | {
28 | "question": "Q: Joan has 10 books. Tom has 38 books. How many books do they have together ?\nA:",
29 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the number of books Joan and Tom have. Joan has 10 books and Tom has 38 books, so: 10 + 38 = 48 Therefore, Joan and Tom have 48 books together.",
30 | "pred_ans": "48",
31 | "gold_ans": "48"
32 | },
33 | {
34 | "question": "Q: Kelly bought 0.1 pounds of peanuts and 0.4 pounds of raisins. How many pounds of snacks did she buy in all?\nA:",
35 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the weight of peanuts and raisins to find the total weight of snacks. 0.1 pounds (peanuts) + 0.4 pounds (raisins) = 0.5 pounds Therefore, Kelly bought 0.5 pounds of snacks in all.",
36 | "pred_ans": "0.5",
37 | "gold_ans": "0.5"
38 | },
39 | {
40 | "question": "Q: Alyssa's high school played 31 hockey games this year. She attended 13 games. How many hockey games did Alyssa miss ?\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down. We know that Alyssa attended 13 hockey games out of 31 total games played by her high school team. To find out how many games she missed, we can subtract the number of games she attended from the total number of games played: 31 - 13 = 18 Therefore, Alyssa missed 18 hockey games.",
42 | "pred_ans": "18",
43 | "gold_ans": "18"
44 | },
45 | {
46 | "question": "Q: Stanley ran 0.4 of a mile and walked 0.2 of a mile. How much farther did Stanley run than walk?\nA:",
47 | "rationale": "Let's think step by step. Sure, let's break it down step by step. First, we need to find the difference between the distance Stanley ran and walked. To do this, we can subtract the distance he walked from the distance he ran: 0.4 - 0.2 = 0.2 So Stanley ran 0.2 miles farther than he walked.",
48 | "pred_ans": "0.2",
49 | "gold_ans": "0.2"
50 | }
51 | ],
52 | "inertia": 237.8219451904297
53 | }
--------------------------------------------------------------------------------
/demos/singleeq_gpt-3.5-turbo-0301_9:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Sara had 21 quarters in her bank. Her dad gave her 49 more quarters. How many quarters does she have now ?\nA:",
5 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to find the total number of quarters Sara has after her dad gave her 49 more quarters. To do this, we can add the number of quarters she had before to the number of quarters her dad gave her. So, the total number of quarters Sara has now is: 21 + 49 = 70 Therefore, Sara has 70 quarters now.",
6 | "pred_ans": "70",
7 | "gold_ans": "70"
8 | },
9 | {
10 | "question": "Q: Ellen went to a garage sale to buy chairs. Each chair is 15 dollars. How much did Ellen spend for the 12 chairs she bought?\nA:",
11 | "rationale": "Let's think step by step. Sure, let's break it down. Ellen bought 12 chairs and each chair costs $15. So, we can multiply the number of chairs by the cost of each chair: 12 x $15 = $180 Therefore, Ellen spent $180 for the 12 chairs she bought.",
12 | "pred_ans": "180",
13 | "gold_ans": "180"
14 | },
15 | {
16 | "question": "Q: Dan has 64 violet marbles, he gave Mary 14 of the marbles. How many violet marbles does he now have ?\nA:",
17 | "rationale": "Let's think step by step. First, we need to subtract the number of marbles Dan gave to Mary from the total number of marbles he had before giving any away. 64 - 14 = 50 Therefore, Dan now has 50 violet marbles.",
18 | "pred_ans": "50",
19 | "gold_ans": "50"
20 | },
21 | {
22 | "question": "Q: Kelly bought 0.1 pounds of peanuts and 0.4 pounds of raisins. How many pounds of snacks did she buy in all?\nA:",
23 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the weight of peanuts and raisins to find the total weight of snacks. 0.1 pounds (peanuts) + 0.4 pounds (raisins) = 0.5 pounds Therefore, Kelly bought 0.5 pounds of snacks in all.",
24 | "pred_ans": "0.5",
25 | "gold_ans": "0.5"
26 | },
27 | {
28 | "question": "Q: Alyssa has 36 books. Nancy has 7 times more books than Alyssa. How many books does Nancy have ?\nA:",
29 | "rationale": "Let's think step by step. Sure, let's break it down. First, we need to find out how many books Nancy has compared to Alyssa. To do this, we can multiply Alyssa's number of books by 7: 36 x 7 = 252 So Nancy has 252 books.",
30 | "pred_ans": "252",
31 | "gold_ans": "252"
32 | },
33 | {
34 | "question": "Q: Sandy grew 51 pumpkins. Mike grew 23 pumpkins. How many pumpkins did they grow in total ?\nA:",
35 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to add the number of pumpkins Sandy grew and the number of pumpkins Mike grew. 51 + 23 = 74 So, they grew a total of 74 pumpkins.",
36 | "pred_ans": "74",
37 | "gold_ans": "74"
38 | },
39 | {
40 | "question": "Q: Stanley ran 0.4 of a mile and walked 0.2 of a mile. How much farther did Stanley run than walk?\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down step by step. First, we need to find the difference between the distance Stanley ran and walked. To do this, we can subtract the distance he walked from the distance he ran: 0.4 - 0.2 = 0.2 So Stanley ran 0.2 miles farther than he walked.",
42 | "pred_ans": "0.2",
43 | "gold_ans": "0.2"
44 | },
45 | {
46 | "question": "Q: There are 33 oak trees currently in the park. Park workers had to cut down 18 oak trees that were damaged. How many oak trees will be in the park when the workers are finished ?\nA:",
47 | "rationale": "Let's think step by step. First, we start with the total number of oak trees in the park, which is 33. Then, we subtract the number of oak trees that were cut down, which is 18. So, the number of oak trees that will be left in the park after the workers are finished is: 33 - 18 = 15 Therefore, there will be 15 oak trees in the park when the workers are finished.",
48 | "pred_ans": "15",
49 | "gold_ans": "15"
50 | },
51 | {
52 | "question": "Q: Melanie, Benny, Sally, and Jessica each have 3 baseball cards. How many baseball cards do they have in all ?\nA:",
53 | "rationale": "Let's think step by step. Sure, let's break it down. We know that Melanie has 3 baseball cards, Benny has 3 baseball cards, Sally has 3 baseball cards, and Jessica has 3 baseball cards. To find out how many baseball cards they have in all, we can add up the number of cards each person has: 3 + 3 + 3 + 3 = 12 So, in total, they have 12 baseball cards.",
54 | "pred_ans": "12",
55 | "gold_ans": "12"
56 | }
57 | ],
58 | "inertia": 234.65257263183594
59 | }
--------------------------------------------------------------------------------
/demos/singleeq_manual:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: There are 15 trees in the grove. Grove workers will plant trees in the grove today. After they are done, there will be 21 trees. How many trees did the grove workers plant today?\nA:",
5 | "rationale": "There are 15 trees originally. Then there were 21 trees after some more were planted. So there must have been 21 - 15 = 6.",
6 | "pred_ans": "6"
7 | },
8 | {
9 | "question": "Q: If there are 3 cars in the parking lot and 2 more cars arrive, how many cars are in the parking lot?\nA:",
10 | "rationale": "There are originally 3 cars. 2 more cars arrive. 3 + 2 = 5.",
11 | "pred_ans": "5"
12 | },
13 | {
14 | "question": "Q: Leah had 32 chocolates and her sister had 42. If they ate 35, how many pieces do they have left in total?\nA:",
15 | "rationale": "Originally, Leah had 32 chocolates. Her sister had 42. So in total they had 32 + 42 = 74. After eating 35, they had 74 - 35 = 39.",
16 | "pred_ans": "39"
17 | },
18 | {
19 | "question": "Q: Jason had 20 lollipops. He gave Denny some lollipops. Now Jason has 12 lollipops. How many lollipops did Jason give to Denny?\nA:",
20 | "rationale": "Jason started with 20 lollipops. Then he had 12 after giving some to Denny. So he gave Denny 20 - 12 = 8.",
21 | "pred_ans": "8"
22 | },
23 | {
24 | "question": "Q: Shawn has five toys. For Christmas, he got two toys each from his mom and dad. How many toys does he have now?\nA:",
25 | "rationale": "Shawn started with 5 toys. If he got 2 toys each from his mom and dad, then that is 4 more toys. 5 + 4 = 9.",
26 | "pred_ans": "9"
27 | },
28 | {
29 | "question": "Q: There were nine computers in the server room. Five more computers were installed each day, from monday to thursday. How many computers are now in the server room?\nA:",
30 | "rationale": "There were originally 9 computers. For each of 4 days, 5 more computers were added. So 5 * 4 = 20 computers were added. 9 + 20 is 29.",
31 | "pred_ans": "29"
32 | },
33 | {
34 | "question": "Q: Michael had 58 golf balls. On tuesday, he lost 23 golf balls. On wednesday, he lost 2 more. How many golf balls did he have at the end of wednesday?\nA:",
35 | "rationale": "Michael started with 58 golf balls. After losing 23 on tuesday, he had 58 - 23 = 35. After losing 2 more, he had 35 - 2 = 33 golf balls.",
36 | "pred_ans": "33"
37 | },
38 | {
39 | "question": "Q: Olivia has $23. She bought five bagels for $3 each. How much money does she have left?\nA:",
40 | "rationale": "Olivia had 23 dollars. 5 bagels for 3 dollars each will be 5 x 3 = 15 dollars. So she has 23 - 15 dollars left. 23 - 15 is 8.",
41 | "pred_ans": "8"
42 | }
43 | ]
44 | }
--------------------------------------------------------------------------------
/demos/strategyqa_gpt-3.5-turbo-0301:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Would a vegetarian be able to eat something at Chick-fil-A?\nA:",
5 | "rationale": "Let's think step by step. Chick-fil-A is a fast-food restaurant that primarily serves chicken-based dishes. However, they do offer some vegetarian options such as their side salad, waffle potato fries, and their fruit cup. They also have a grilled chicken cool wrap that can be made without chicken for a vegetarian option. However, it's important to note that Chick-fil-A uses the same fryer for both their chicken and their waffle fries, so cross-contamination may occur. Therefore, it's best to ask the staff about their preparation methods and ingredients to ensure that the food is suitable for a vegetarian diet.",
6 | "pred_ans": "yes",
7 | "gold_ans": "yes"
8 | },
9 | {
10 | "question": "Q: Did Julia Roberts practice blast beats as a child?\nA:",
11 | "rationale": "Let's think step by step. I'm sorry, but that question is not related to math. As a math assistant, I can help you with any math-related questions or problems you may have. Please let me know how I can assist you.",
12 | "pred_ans": "no",
13 | "gold_ans": "no"
14 | },
15 | {
16 | "question": "Q: Could someone in Tokyo take a taxi to the The Metropolitan Museum of Art?\nA:",
17 | "rationale": "Let's think step by step. Sure, we can break down the problem into smaller parts to find the answer. First, we need to determine the distance between Tokyo and The Metropolitan Museum of Art. The Metropolitan Museum of Art is located in New York City, USA, so we need to find the distance between Tokyo and New York City. The distance between Tokyo and New York City is approximately 6,735 miles (10,840 kilometers). Next, we need to determine if it is possible to take a taxi from Tokyo to The Metropolitan Museum of Art. Unfortunately, it is not possible to take a taxi from Tokyo to The Metropolitan Museum of Art as they are located on different continents and separated by an ocean. Therefore, it is not possible for someone in Tokyo to take a taxi to The Metropolitan Museum of Art.",
18 | "pred_ans": "no",
19 | "gold_ans": "no"
20 | },
21 | {
22 | "question": "Q: Will Queen Elizabeth be buried in the Pantheon?\nA:",
23 | "rationale": "Let's think step by step. As a math assistant, I don't have information about the burial plans of Queen Elizabeth. However, I can tell you that the Pantheon is a famous ancient temple in Rome that was converted into a church. It is the final resting place of many famous Italians, including the artist Raphael. It is unlikely that Queen Elizabeth will be buried there as she is not Italian and has no direct connection to the Pantheon.",
24 | "pred_ans": "no",
25 | "gold_ans": "no"
26 | },
27 | {
28 | "question": "Q: Would a goblin shark eat at Crossroads Kitchen?\nA:",
29 | "rationale": "Let's think step by step. First, we need to understand what a goblin shark is and what it eats. A goblin shark is a deep-sea shark that primarily feeds on fish and cephalopods. Next, we need to understand what Crossroads Kitchen is. Crossroads Kitchen is a vegan restaurant in Los Angeles that serves plant-based dishes. Based on this information, it is highly unlikely that a goblin shark would eat at Crossroads Kitchen since it primarily feeds on fish and cephalopods, which are not served at the restaurant. Additionally, since Crossroads Kitchen is a vegan restaurant, it does not serve any animal products, which would not be suitable for a goblin shark's diet.",
30 | "pred_ans": "no",
31 | "gold_ans": "no"
32 | },
33 | {
34 | "question": "Q: Did the 40th president of the United States forward lolcats to his friends?\nA:",
35 | "rationale": "Let's think step by step. First, we need to identify who the 40th president of the United States was. The 40th president was Ronald Reagan. Next, we need to determine if forwarding lolcats to friends was something that was possible during Reagan's presidency. Lolcats, or funny cat pictures with captions, became popular on the internet in the early 2000s, which was after Reagan's presidency ended in 1989. Therefore, it is unlikely that Reagan forwarded lolcats to his friends during his presidency. In conclusion, it is highly unlikely that the 40th president of the United States forwarded lolcats to his friends.",
36 | "pred_ans": "no",
37 | "gold_ans": "no"
38 | }
39 | ]
40 | }
--------------------------------------------------------------------------------
/demos/strategyqa_gpt-3.5-turbo-0301_8:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Did Dr. Seuss make himself famous?\nA:",
5 | "rationale": "Let's think step by step. Dr. Seuss, whose real name was Theodor Seuss Geisel, became famous for his children's books such as \"The Cat in the Hat,\" \"Green Eggs and Ham,\" and \"How the Grinch Stole Christmas.\" He wrote and illustrated over 60 books during his career, which spanned several decades. So, did he make himself famous? In a way, yes. Dr. Seuss's unique style of writing and illustration set him apart from other children's book authors of his time. He created memorable characters and stories that captured the imaginations of children and adults alike. However, he also had help from publishers, editors, and other professionals in the book industry who helped promote his work and bring it to a wider audience. Ultimately, it was a combination of Dr. Seuss's talent and hard work, along with the support of others in the industry, that led to his fame and success.",
6 | "pred_ans": "yes",
7 | "gold_ans": "no"
8 | },
9 | {
10 | "question": "Q: Did the 40th president of the United States forward lolcats to his friends?\nA:",
11 | "rationale": "Let's think step by step. First, we need to identify who the 40th president of the United States was. The 40th president was Ronald Reagan. Next, we need to determine if forwarding lolcats to friends was something that was possible during Reagan's presidency. Lolcats, or funny cat pictures with captions, became popular on the internet in the early 2000s, which was after Reagan's presidency ended in 1989. Therefore, it is unlikely that Reagan forwarded lolcats to his friends during his presidency. In conclusion, it is highly unlikely that the 40th president of the United States forwarded lolcats to his friends.",
12 | "pred_ans": "no",
13 | "gold_ans": "no"
14 | },
15 | {
16 | "question": "Q: Did Christopher Columbus go to Antarctica?\nA:",
17 | "rationale": "Let's think step by step. Christopher Columbus is known for his voyages across the Atlantic Ocean, but he did not travel to Antarctica. Columbus lived in the 15th century, and Antarctica was not discovered until the 19th century. Additionally, Antarctica is located at the southernmost point of the Earth, while Columbus traveled to the Americas, which are located in the northern hemisphere.",
18 | "pred_ans": "no",
19 | "gold_ans": "no"
20 | },
21 | {
22 | "question": "Q: Are honey badgers and hyenas anatomically dissimilar?\nA:",
23 | "rationale": "Let's think step by step. As a math assistant, I can tell you that honey badgers and hyenas are two different species of animals and therefore have different anatomical structures. However, if you have a specific question about their anatomical differences, I can try to help you find the answer.",
24 | "pred_ans": "yes",
25 | "gold_ans": "no"
26 | },
27 | {
28 | "question": "Q: Can monkeys use QWERTY keyboards?\nA:",
29 | "rationale": "Let's think step by step. First, we need to understand what a QWERTY keyboard is. It is a keyboard layout that is commonly used for English language typing. Next, we need to consider the physical abilities of monkeys. While monkeys are intelligent animals, they do not have the same level of fine motor skills as humans. They may struggle to accurately press individual keys on a keyboard. Additionally, monkeys may not have the cognitive ability to understand the purpose of a keyboard or how to use it to input information. Therefore, it is unlikely that monkeys would be able to effectively use a QWERTY keyboard.",
30 | "pred_ans": "no",
31 | "gold_ans": "yes"
32 | },
33 | {
34 | "question": "Q: Could Marco Rubio ride the Candymonium roller coaster at Hershey Park?\nA:",
35 | "rationale": "Let's think step by step. First, we need to determine the height requirement for the Candymonium roller coaster at Hershey Park. According to the Hershey Park website, riders must be at least 54 inches tall to ride. Next, we need to find out how tall Marco Rubio is. According to public records, Marco Rubio is 5 feet 10 inches tall, which is equivalent to 70 inches. Since Marco Rubio is taller than the height requirement of 54 inches, he would be able to ride the Candymonium roller coaster at Hershey Park.",
36 | "pred_ans": "yes",
37 | "gold_ans": "yes"
38 | },
39 | {
40 | "question": "Q: Will Queen Elizabeth be buried in the Pantheon?\nA:",
41 | "rationale": "Let's think step by step. As a math assistant, I don't have information about the burial plans of Queen Elizabeth. However, I can tell you that the Pantheon is a famous ancient temple in Rome that was converted into a church. It is the final resting place of many famous Italians, including the artist Raphael. It is unlikely that Queen Elizabeth will be buried there as she is not Italian and has no direct connection to the Pantheon.",
42 | "pred_ans": "no",
43 | "gold_ans": "no"
44 | },
45 | {
46 | "question": "Q: Would a vegetarian be able to eat something at Chick-fil-A?\nA:",
47 | "rationale": "Let's think step by step. Chick-fil-A is a fast-food restaurant that primarily serves chicken-based dishes. However, they do offer some vegetarian options such as their side salad, waffle potato fries, and their fruit cup. They also have a grilled chicken cool wrap that can be made without chicken for a vegetarian option. However, it's important to note that Chick-fil-A uses the same fryer for both their chicken and their waffle fries, so cross-contamination may occur. Therefore, it's best to ask the staff about their preparation methods and ingredients to ensure that the food is suitable for a vegetarian diet.",
48 | "pred_ans": "yes",
49 | "gold_ans": "yes"
50 | }
51 | ],
52 | "inertia": 3594.966552734375
53 | }
--------------------------------------------------------------------------------
/demos/strategyqa_manual:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Do hamsters provide food for any animals?\nA:",
5 | "rationale": "Hamsters are prey animals. Prey are food for predators. Thus, hamsters provide food for some animals. So the answer is yes.",
6 | "pred_ans": "yes"
7 | },
8 | {
9 | "question": "Q: Could Brooke Shields succeed at University of Pennsylvania?\nA:",
10 | "rationale": "Brooke Shields went to Princeton University. Princeton University is about as academically rigorous as the University of Pennsylvania. Thus, Brooke Shields could also succeed at the University of Pennsylvania. So the answer is yes.",
11 | "pred_ans": "yes"
12 | },
13 | {
14 | "question": "Q: Yes or no: Hydrogen’s atomic number squared exceeds number of Spice Girls?\nA:",
15 | "rationale": "Hydrogen has an atomic number of 1. 1 squared is 1. There are 5 Spice Girls. Thus, Hydrogen’s atomic number squared is less than 5. So the answer is no.",
16 | "pred_ans": "no"
17 | },
18 | {
19 | "question": "Q: Yes or no: Is it common to see frost during some college commencements?\nA:",
20 | "rationale": "College commencement ceremonies can happen in December, May, and June. December is in the winter, so there can be frost. Thus, there could be frost at some commencements. So the answer is yes.",
21 | "pred_ans": "yes"
22 | },
23 | {
24 | "question": "Q: Yes or no: Could a llama birth twice during War in Vietnam (1945-46)?\nA:",
25 | "rationale": "The War in Vietnam was 6 months. The gestation period for a llama is 11 months, which is more than 6 months. Thus, a llama could not give birth twice during the War in Vietnam. So the answer is no.",
26 | "pred_ans": "no"
27 | },
28 | {
29 | "question": "Q: Yes or no: Would a pear sink in water?\nA:",
30 | "rationale": "The density of a pear is about 0.6g/cm3, which is less than water. Objects less dense than water float. Thus, a pear would float. So the answer is no.",
31 | "pred_ans": "no"
32 | }
33 | ]
34 | }
--------------------------------------------------------------------------------
/demos/svamp_gpt-3.5-turbo-0301:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: 28 children were riding on the bus. At the bus stop 82 children got on the bus while some got off the bus. Then there were 30 children altogether on the bus. How many more children got on the bus than those that got off?\nA:",
5 | "rationale": "Let's think step by step. First, we need to find out how many children got off the bus. We know that there were 28 children on the bus before the stop, and 82 got on, so there were 28 + 82 = 110 children on the bus at the stop. Next, we subtract the number of children on the bus after the stop (30) from the number of children on the bus at the stop (110) to find out how many got off: 110 - 30 = 80. Therefore, 80 children got off the bus. Finally, we subtract the number of children who got off the bus (80) from the number of children who got on the bus (82) to find out how many more got on than got off: 82 - 80 = 2. Therefore, 2 more children got on the bus than got off.",
6 | "pred_ans": "2",
7 | "gold_ans": "2"
8 | },
9 | {
10 | "question": "Q: Danny collects bottle caps and wrappers. He found 22 bottle caps and 30 wrappers at the park. Now he has 17 bottle caps and 57 wrappers in his collection. How many wrappers did danny have at first?\nA:",
11 | "rationale": "Let's think step by step. First, we need to find out how many bottle caps and wrappers Danny had at first. We can do this by adding the number of bottle caps and wrappers he found at the park to the number he has in his collection now: Initial number of bottle caps = 22 + 17 = 39 Initial number of wrappers = 30 + 57 = 87 Therefore, Danny had 87 wrappers at first.",
12 | "pred_ans": "87",
13 | "gold_ans": "27"
14 | },
15 | {
16 | "question": "Q: Jerry had 8 action figures and 9 books on a shelf in his room. Later he added 10 more books to the shelf. How many books were on his shelf in all?\nA:",
17 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to find the total number of books Jerry had on the shelf before adding 10 more books. We know that he had 9 books on the shelf initially, so we add that to the number of books he added later: 9 + 10 = 19 So, Jerry had 19 books on the shelf after adding 10 more books.",
18 | "pred_ans": "19",
19 | "gold_ans": "19"
20 | },
21 | {
22 | "question": "Q: Bobby had 21 pieces of candy. He ate 5 pieces of candy. Then he ate 9 more. How many pieces of candy does he still have left?\nA:",
23 | "rationale": "Let's think step by step. First, Bobby had 21 pieces of candy. Then he ate 5 pieces of candy, so he now has 21 - 5 = 16 pieces of candy left. After that, he ate 9 more pieces of candy, so he now has 16 - 9 = 7 pieces of candy left. Therefore, Bobby has 7 pieces of candy left.",
24 | "pred_ans": "7",
25 | "gold_ans": "7"
26 | },
27 | {
28 | "question": "Q: Jake has 3 fewer peaches and 4 more apples than Steven. Steven has 19 apples and 15 peaches. How many more apples than peaches does Steven have?\nA:",
29 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to find out how many apples and peaches Jake has. We know that Jake has 3 fewer peaches than Steven, so Jake has 15 - 3 = 12 peaches. We also know that Jake has 4 more apples than Steven, so Jake has 19 + 4 = 23 apples. Next, we need to find out how many more apples than peaches Steven has. Steven has 19 apples and 15 peaches, so he has 19 - 15 = 4 more apples than peaches. Therefore, Steven has 4 more apples than peaches.",
30 | "pred_ans": "4",
31 | "gold_ans": "4"
32 | },
33 | {
34 | "question": "Q: The grasshopper and the frog had a jumping contest. The frog jumped 39 inches and the grasshopper jumped 17 inches. How much farther did the frog jump than the grasshopper?\nA:",
35 | "rationale": "Let's think step by step. Sure, let's break it down step by step. Step 1: Find the difference between the two jumps. To find how much farther the frog jumped than the grasshopper, we need to subtract the length of the grasshopper's jump from the length of the frog's jump. 39 inches - 17 inches = 22 inches Therefore, the frog jumped 22 inches farther than the grasshopper.",
36 | "pred_ans": "22",
37 | "gold_ans": "22"
38 | },
39 | {
40 | "question": "Q: Mary is baking a cake. The recipe calls for 9 cups of flour and 5 cups of sugar. She already put in 3 cups of flour and 62 cups of sugar. How many more cups of flour does she need to add?\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down. Mary needs a total of 9 cups of flour for the recipe, and she has already added 3 cups. So, she still needs to add 9 - 3 = 6 cups of flour. Therefore, Mary needs to add 6 more cups of flour to complete the recipe.",
42 | "pred_ans": "6",
43 | "gold_ans": "6"
44 | },
45 | {
46 | "question": "Q: Every day Ryan spends 6 hours on learning english and 7 hours on learning chinese. How many more hours does he spend on learning chinese than he does on learning english?\nA:",
47 | "rationale": "Let's think step by step. Sure, let's break it down. First, we need to find the difference between the number of hours Ryan spends on learning Chinese and English. To do this, we can subtract the number of hours he spends on learning English from the number of hours he spends on learning Chinese: 7 hours (Chinese) - 6 hours (English) = 1 hour Therefore, Ryan spends 1 more hour on learning Chinese than he does on learning English.",
48 | "pred_ans": "1",
49 | "gold_ans": "1"
50 | }
51 | ]
52 | }
--------------------------------------------------------------------------------
/demos/svamp_gpt-3.5-turbo-0301_10:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: Randy has 37 blocks. He uses 33 blocks to build a tower and 13 blocks to build a house. How many more blocks did he use to build the tower than he did to build the house?\nA:",
5 | "rationale": "Let's think step by step. First, we need to find out how many blocks Randy used to build the tower minus how many blocks he used to build the house. Tower blocks: 33 House blocks: 13 33 - 13 = 20 Therefore, Randy used 20 more blocks to build the tower than he did to build the house.",
6 | "pred_ans": "20",
7 | "gold_ans": "20"
8 | },
9 | {
10 | "question": "Q: Tiffany was collecting cans for recycling. On monday she had 3 bags of cans. The next day she found 7 more bags of cans and 44 bags of bottles. How many bags of cans did she have altogether?\nA:",
11 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we know that on Monday, Tiffany had 3 bags of cans. Next, we know that the next day, she found 7 more bags of cans. So, she now has 3 + 7 = 10 bags of cans. Finally, we need to add the 44 bags of bottles that she found to the 10 bags of cans that she now has. So, Tiffany has a total of 10 + 44 = 54 bags of cans and bottles altogether. Therefore, Tiffany has 54 bags of cans and bottles altogether.",
12 | "pred_ans": "54",
13 | "gold_ans": "10"
14 | },
15 | {
16 | "question": "Q: In a school there are 632 girls and 410 boys. 465 more girls joined the school. How many more girls than boys does the school have?\nA:",
17 | "rationale": "Let's think step by step. First, we need to find the total number of girls in the school after 465 more girls joined. 632 (original number of girls) + 465 (new girls) = 1097 girls Next, we can find the difference between the number of girls and boys: 1097 (girls) - 410 (boys) = 687 Therefore, the school has 687 more girls than boys.",
18 | "pred_ans": "687",
19 | "gold_ans": "687"
20 | },
21 | {
22 | "question": "Q: Baker made 54 cakes. He sold some of them. If he still has 13 cakes left How many cakes did baker sell?\nA:",
23 | "rationale": "Let's think step by step. First, we know that Baker made 54 cakes. Then, we know that he sold some of them and has 13 cakes left. To find out how many cakes Baker sold, we can subtract the number of cakes he has left from the total number of cakes he made: 54 - 13 = 41 Therefore, Baker sold 41 cakes.",
24 | "pred_ans": "41",
25 | "gold_ans": "41"
26 | },
27 | {
28 | "question": "Q: Allan brought 2 balloons to the park and then bought 3 more balloons there. If Jake brought 6 balloons to the park How many more balloons did Jake have than Allan in the park?\nA:",
29 | "rationale": "Let's think step by step. Allan brought 2 balloons to the park and then bought 3 more balloons there, so he had a total of 2 + 3 = 5 balloons in the park. Jake brought 6 balloons to the park, so he had 6 - 5 = 1 more balloon than Allan in the park. Therefore, Jake had 1 more balloon than Allan in the park.",
30 | "pred_ans": "1",
31 | "gold_ans": "1"
32 | },
33 | {
34 | "question": "Q: Jake has 84 more apples and 10 fewer peaches than Steven. Steven has 13 peaches and 52 apples. How many peaches does Jake have?\nA:",
35 | "rationale": "Let's think step by step. First, we need to find out how many apples Jake has. We know that Jake has 84 more apples than Steven, who has 52 apples. So, Jake has: 52 + 84 = 136 apples Next, we need to find out how many peaches Jake has. We know that Jake has 10 fewer peaches than Steven, who has 13 peaches. So, Jake has: 13 - 10 = 3 peaches Therefore, Jake has 3 peaches.",
36 | "pred_ans": "3",
37 | "gold_ans": "3"
38 | },
39 | {
40 | "question": "Q: Jerry had 8 action figures and 9 books on a shelf in his room. Later he added 10 more books to the shelf. How many books were on his shelf in all?\nA:",
41 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to find the total number of books Jerry had on the shelf before adding 10 more books. We know that he had 9 books on the shelf initially, so we add that to the number of books he added later: 9 + 10 = 19 So, Jerry had 19 books on the shelf after adding 10 more books.",
42 | "pred_ans": "19",
43 | "gold_ans": "19"
44 | },
45 | {
46 | "question": "Q: 6 birds were sitting on the fence. 4 more birds and 8 more storks came to join them. How many birds are sitting on the fence?\nA:",
47 | "rationale": "Let's think step by step. First, we need to find the total number of birds that were on the fence before the others joined. We know that there were 6 birds on the fence initially. Next, we need to add the number of birds that joined them. We are told that 4 more birds and 8 more storks came to join them. So, the total number of birds that joined them is 4 + 8 = 12. Finally, we can add the number of birds that were already on the fence to the number of birds that joined them to find the total number of birds on the fence. 6 (initial birds) + 12 (birds that joined) = 18 Therefore, there are 18 birds sitting on the fence.",
48 | "pred_ans": "18",
49 | "gold_ans": "10"
50 | },
51 | {
52 | "question": "Q: Zachary did 59 push-ups and 44 crunches in gym class today. David did 19 more push-ups but 27 less crunches than zachary. How many push-ups did David do?\nA:",
53 | "rationale": "Let's think step by step. Step 1: We know that Zachary did 59 push-ups and 44 crunches. Step 2: We also know that David did 19 more push-ups than Zachary, so we can add 19 to 59 to get David's push-up count: 59 + 19 = 78 push-ups. Step 3: We also know that David did 27 less crunches than Zachary, so we can subtract 27 from 44 to get David's crunch count: 44 - 27 = 17 crunches. Step 4: Therefore, David did 78 push-ups and 17 crunches.",
54 | "pred_ans": "78",
55 | "gold_ans": "78"
56 | }
57 | ],
58 | "inertia": 423.7147216796875
59 | }
--------------------------------------------------------------------------------
/demos/svamp_gpt-3.5-turbo-0301_8:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: 28 children were riding on the bus. At the bus stop 82 children got on the bus while some got off the bus. Then there were 30 children altogether on the bus. How many more children got on the bus than those that got off?\nA:",
5 | "rationale": "Let's think step by step. First, we need to find out how many children got off the bus. We know that there were 28 children on the bus before the stop, and 82 got on, so there were 28 + 82 = 110 children on the bus at the stop. Next, we subtract the number of children on the bus after the stop (30) from the number of children on the bus at the stop (110) to find out how many got off: 110 - 30 = 80. Therefore, 80 children got off the bus. Finally, we subtract the number of children who got off the bus (80) from the number of children who got on the bus (82) to find out how many more got on than got off: 82 - 80 = 2. Therefore, 2 more children got on the bus than got off.",
6 | "pred_ans": "2",
7 | "gold_ans": "2"
8 | },
9 | {
10 | "question": "Q: Danny collects bottle caps and wrappers. He found 22 bottle caps and 30 wrappers at the park. Now he has 17 bottle caps and 57 wrappers in his collection. How many wrappers did danny have at first?\nA:",
11 | "rationale": "Let's think step by step. First, we need to find out how many bottle caps and wrappers Danny had at first. We can do this by adding the number of bottle caps and wrappers he found at the park to the number he has in his collection now: Initial number of bottle caps = 22 + 17 = 39 Initial number of wrappers = 30 + 57 = 87 Therefore, Danny had 87 wrappers at first.",
12 | "pred_ans": "87",
13 | "gold_ans": "27"
14 | },
15 | {
16 | "question": "Q: Jerry had 8 action figures and 9 books on a shelf in his room. Later he added 10 more books to the shelf. How many books were on his shelf in all?\nA:",
17 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to find the total number of books Jerry had on the shelf before adding 10 more books. We know that he had 9 books on the shelf initially, so we add that to the number of books he added later: 9 + 10 = 19 So, Jerry had 19 books on the shelf after adding 10 more books.",
18 | "pred_ans": "19",
19 | "gold_ans": "19"
20 | },
21 | {
22 | "question": "Q: Bobby had 21 pieces of candy. He ate 5 pieces of candy. Then he ate 9 more. How many pieces of candy does he still have left?\nA:",
23 | "rationale": "Let's think step by step. First, Bobby had 21 pieces of candy. Then he ate 5 pieces of candy, so he now has 21 - 5 = 16 pieces of candy left. After that, he ate 9 more pieces of candy, so he now has 16 - 9 = 7 pieces of candy left. Therefore, Bobby has 7 pieces of candy left.",
24 | "pred_ans": "7",
25 | "gold_ans": "7"
26 | },
27 | {
28 | "question": "Q: Jake has 3 fewer peaches and 4 more apples than Steven. Steven has 19 apples and 15 peaches. How many more apples than peaches does Steven have?\nA:",
29 | "rationale": "Let's think step by step. Sure, let's solve this problem step by step. First, we need to find out how many apples and peaches Jake has. We know that Jake has 3 fewer peaches than Steven, so Jake has 15 - 3 = 12 peaches. We also know that Jake has 4 more apples than Steven, so Jake has 19 + 4 = 23 apples. Next, we need to find out how many more apples than peaches Steven has. Steven has 19 apples and 15 peaches, so he has 19 - 15 = 4 more apples than peaches. Therefore, Steven has 4 more apples than peaches.",
30 | "pred_ans": "4",
31 | "gold_ans": "4"
32 | },
33 | {
34 | "question": "Q: The grasshopper and the frog had a jumping contest. The frog jumped 39 inches and the grasshopper jumped 17 inches. How much farther did the frog jump than the grasshopper?\nA:",
35 | "rationale": "Let's think step by step. Sure, let's break it down step by step. Step 1: Find the difference between the two jumps. To find how much farther the frog jumped than the grasshopper, we need to subtract the length of the grasshopper's jump from the length of the frog's jump. 39 inches - 17 inches = 22 inches Therefore, the frog jumped 22 inches farther than the grasshopper.",
36 | "pred_ans": "22",
37 | "gold_ans": "22"
38 | },
39 | {
40 | "question": "Q: Mary is baking a cake. The recipe calls for 9 cups of flour and 5 cups of sugar. She already put in 3 cups of flour and 62 cups of sugar. How many more cups of flour does she need to add?\nA:",
41 | "rationale": "Let's think step by step. Sure, let's break it down. Mary needs a total of 9 cups of flour for the recipe, and she has already added 3 cups. So, she still needs to add 9 - 3 = 6 cups of flour. Therefore, Mary needs to add 6 more cups of flour to complete the recipe.",
42 | "pred_ans": "6",
43 | "gold_ans": "6"
44 | },
45 | {
46 | "question": "Q: Every day Ryan spends 6 hours on learning english and 7 hours on learning chinese. How many more hours does he spend on learning chinese than he does on learning english?\nA:",
47 | "rationale": "Let's think step by step. Sure, let's break it down. First, we need to find the difference between the number of hours Ryan spends on learning Chinese and English. To do this, we can subtract the number of hours he spends on learning English from the number of hours he spends on learning Chinese: 7 hours (Chinese) - 6 hours (English) = 1 hour Therefore, Ryan spends 1 more hour on learning Chinese than he does on learning English.",
48 | "pred_ans": "1",
49 | "gold_ans": "1"
50 | }
51 | ],
52 | "inertia": 439.5946350097656
53 | }
--------------------------------------------------------------------------------
/demos/svamp_manual:
--------------------------------------------------------------------------------
1 | {
2 | "demo": [
3 | {
4 | "question": "Q: There are 15 trees in the grove. Grove workers will plant trees in the grove today. After they are done, there will be 21 trees. How many trees did the grove workers plant today?\nA:",
5 | "rationale": "There are 15 trees originally. Then there were 21 trees after some more were planted. So there must have been 21 - 15 = 6.",
6 | "pred_ans": "6"
7 | },
8 | {
9 | "question": "Q: If there are 3 cars in the parking lot and 2 more cars arrive, how many cars are in the parking lot?\nA:",
10 | "rationale": "There are originally 3 cars. 2 more cars arrive. 3 + 2 = 5.",
11 | "pred_ans": "5"
12 | },
13 | {
14 | "question": "Q: Leah had 32 chocolates and her sister had 42. If they ate 35, how many pieces do they have left in total?\nA:",
15 | "rationale": "Originally, Leah had 32 chocolates. Her sister had 42. So in total they had 32 + 42 = 74. After eating 35, they had 74 - 35 = 39.",
16 | "pred_ans": "39"
17 | },
18 | {
19 | "question": "Q: Jason had 20 lollipops. He gave Denny some lollipops. Now Jason has 12 lollipops. How many lollipops did Jason give to Denny?\nA:",
20 | "rationale": "Jason started with 20 lollipops. Then he had 12 after giving some to Denny. So he gave Denny 20 - 12 = 8.",
21 | "pred_ans": "8"
22 | },
23 | {
24 | "question": "Q: Shawn has five toys. For Christmas, he got two toys each from his mom and dad. How many toys does he have now?\nA:",
25 | "rationale": "Shawn started with 5 toys. If he got 2 toys each from his mom and dad, then that is 4 more toys. 5 + 4 = 9.",
26 | "pred_ans": "9"
27 | },
28 | {
29 | "question": "Q: There were nine computers in the server room. Five more computers were installed each day, from monday to thursday. How many computers are now in the server room?\nA:",
30 | "rationale": "There were originally 9 computers. For each of 4 days, 5 more computers were added. So 5 * 4 = 20 computers were added. 9 + 20 is 29.",
31 | "pred_ans": "29"
32 | },
33 | {
34 | "question": "Q: Michael had 58 golf balls. On tuesday, he lost 23 golf balls. On wednesday, he lost 2 more. How many golf balls did he have at the end of wednesday?\nA:",
35 | "rationale": "Michael started with 58 golf balls. After losing 23 on tuesday, he had 58 - 23 = 35. After losing 2 more, he had 35 - 2 = 33 golf balls.",
36 | "pred_ans": "33"
37 | },
38 | {
39 | "question": "Q: Olivia has $23. She bought five bagels for $3 each. How much money does she have left?\nA:",
40 | "rationale": "Olivia had 23 dollars. 5 bagels for 3 dollars each will be 5 x 3 = 15 dollars. So she has 23 - 15 dollars left. 23 - 15 is 8.",
41 | "pred_ans": "8"
42 | }
43 | ]
44 | }
--------------------------------------------------------------------------------
/echo.webp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Xalp/ECHO/5de37648cd8ea0f9cc87b3565a3c33a468dcdf96/echo.webp
--------------------------------------------------------------------------------
/run/create_demos.sh:
--------------------------------------------------------------------------------
1 | # Define the array of dataset names
2 | dataset_names=("multiarith" "gsm8k" "singleeq" "addsub" "aqua" "svamp" "commonsensqa" "strategyqa" "last_letters" "coin_flip") # Add more dataset names as needed
3 | model_name="gpt-3.5-turbo-0301"
4 |
5 | # Loop over dataset names
6 | for dataset_name in "${dataset_names[@]}"; do
7 |
8 | # Loop over cluster numbers from 8 to 32
9 | for num_clusters in {8..32}; do
10 |
11 | python run_demo.py \
12 | --task $dataset_name \
13 | --pred_file log/${dataset_name}_${model_name}_zero_shot_cot.log \
14 | --demo_save_dir demos/${dataset_name}_${model_name}_${num_clusters} \
15 | --num_clusters ${num_clusters}
16 |
17 | done
18 | done
--------------------------------------------------------------------------------
/run/create_log.sh:
--------------------------------------------------------------------------------
1 | # Run zero_shot_cot.py on every dataset and append its standard output to
2 | # log/<dataset>_<model>_zero_shot_cot.log.
3 | dataset_names=("multiarith" "gsm8k" "singleeq" "addsub" "aqua" "svamp" "commonsensqa" "strategyqa" "last_letters" "coin_flip") # Add more dataset names as needed
4 | model_name="gpt-3.5-turbo-0301"
5 | 
6 | # If the log directory is missing, the append redirection below fails and the
7 | # shell never starts python, so make sure the directory exists first.
8 | mkdir -p log
9 | 
10 | # Loop over dataset names
11 | for dataset_name in "${dataset_names[@]}"; do
12 | 
13 |     log_file="log/${dataset_name}_${model_name}_zero_shot_cot.log"
14 | 
15 |     # ">>" appends: re-running the script adds to an existing log file rather
16 |     # than replacing it. The redirection is kept at the end of the command so
17 |     # it is not mistaken for one of the script's arguments.
18 |     python zero_shot_cot.py \
19 |         --dataset "$dataset_name" \
20 |         --method zero_shot_cot \
21 |         --model "$model_name" \
22 |         --limit_dataset_size 0 \
23 |         >> "$log_file"
24 | 
25 | done
--------------------------------------------------------------------------------
/run/run_echo.sh:
--------------------------------------------------------------------------------
1 | # Configuration for a single run_ECHO.py invocation.
2 | dataset_name="commonsensqa"
3 | model_name="gpt-3.5-turbo-0301"       # used in the name of the input demo directory
4 | ECHO_model_name="gpt-3.5-turbo-0301"  # passed to run_ECHO.py as --model
5 | num_clusters=8
6 | iter_ECHO=2
7 | 
8 | # Input demo directory and output directory derived from the settings above.
9 | demo_path="demos/${dataset_name}_${model_name}_${num_clusters}"
10 | output_dir="ECHO_demos/${dataset_name}_${ECHO_model_name}_${num_clusters}_${iter_ECHO}"
11 | 
12 | # step 3: generate the ECHO demo
13 | python run_ECHO.py \
14 |     --dataset "$dataset_name" \
15 |     --method auto_cot \
16 |     --demo_path "$demo_path" \
17 |     --output_dir "$output_dir" \
18 |     --iter "$iter_ECHO" \
19 |     --model "$ECHO_model_name"
20 | 
21 | # sleep 2
22 | 
23 | # # step 4: inference and evaluate
24 | # python run_inference.py \
25 | # --dataset $dataset_name \
26 | # --demo_path ECHO_demos/${dataset_name}_${ECHO_model_name}_${num_clusters}_${iter_ECHO} \
27 | # --output_dir experiment/${dataset_name}_${model_name}_${num_clusters}_${iter_ECHO} \
28 | # --method auto_cot \
29 | # --model $model_name
--------------------------------------------------------------------------------
/run/run_echo_max.sh:
--------------------------------------------------------------------------------
1 | # Configuration for a single run_ECHO_max.py invocation.
2 | dataset_name="coin_flip"
3 | model_name="gpt-3.5-turbo-0301"
4 | # Only referenced by the commented-out step 4 below (experiment output path).
5 | num_clusters=32
6 | 
7 | 
8 | # step 3: generate the ECHO demo
9 | python run_ECHO_max.py \
10 |     --dataset "$dataset_name" \
11 |     --method auto_cot \
12 |     --demo_path "demos/${dataset_name}_${model_name}" \
13 |     --output_dir "ECHO_demos/${dataset_name}_${model_name}_max" \
14 |     --model "$model_name"
15 | 
16 | # NOTE(review): presumably a pause before step 4; with step 4 commented out it
17 | # only delays the script's exit. Kept to preserve existing behavior.
18 | sleep 2
19 | 
20 | # # step 4: inference and evaluate
21 | # python run_inference.py \
22 | # --dataset $dataset_name \
23 | # --demo_path ECHO_demos/${dataset_name}_${model_name}_max \
24 | # --output_dir experiment/${dataset_name}_${model_name}_${num_clusters}_max \
25 | # --method auto_cot \
26 | # --model $model_name
--------------------------------------------------------------------------------