├── .gitignore ├── LICENSE.txt ├── README.md ├── README_JA.md ├── README_ZH.md ├── benchmark ├── README.md ├── benchmark_eval.py ├── infer_baichuan.py ├── infer_qwen.py └── requirements.txt ├── blob ├── example-zh.gif ├── example.gif ├── logo.png └── overview.png ├── examples └── custom_tool_example.py ├── kwaiagents ├── agent_start.py ├── agents │ ├── __init__.py │ ├── agent_profile.py │ ├── kagent.py │ └── prompts.py ├── config.py ├── llms │ ├── __init__.py │ └── clients.py ├── tools │ ├── __init__.py │ ├── base.py │ ├── browser.py │ ├── calendars.py │ ├── commons.py │ ├── search.py │ ├── solarterms.py │ ├── timedelta.py │ └── weather.py └── utils │ ├── chain_logger.py │ ├── date_utils.py │ ├── function_utils.py │ ├── html_utils.py │ ├── json_fix_general.py │ ├── nlp_utils.py │ └── selenium_utils.py ├── requirements.txt └── setup.py /.gitignore: -------------------------------------------------------------------------------- 1 | # Byte-compiled / optimized / DLL files 2 | __pycache__/ 3 | *.py[cod] 4 | *$py.class 5 | 6 | # C extensions 7 | *.so 8 | 9 | # Distribution / packaging 10 | .Python 11 | build/ 12 | develop-eggs/ 13 | dist/ 14 | downloads/ 15 | eggs/ 16 | .eggs/ 17 | lib/ 18 | lib64/ 19 | parts/ 20 | sdist/ 21 | var/ 22 | wheels/ 23 | share/python-wheels/ 24 | *.egg-info/ 25 | .installed.cfg 26 | *.egg 27 | MANIFEST 28 | 29 | # PyInstaller 30 | # Usually these files are written by a python script from a template 31 | # before PyInstaller builds the exe, so as to inject date/other infos into it. 
32 | *.manifest 33 | *.spec 34 | 35 | # Installer logs 36 | pip-log.txt 37 | pip-delete-this-directory.txt 38 | 39 | # Unit test / coverage reports 40 | htmlcov/ 41 | .tox/ 42 | .nox/ 43 | .coverage 44 | .coverage.* 45 | .cache 46 | nosetests.xml 47 | coverage.xml 48 | *.cover 49 | *.py,cover 50 | .hypothesis/ 51 | .pytest_cache/ 52 | cover/ 53 | 54 | # Translations 55 | *.mo 56 | *.pot 57 | 58 | # Django stuff: 59 | *.log 60 | local_settings.py 61 | db.sqlite3 62 | db.sqlite3-journal 63 | 64 | # Flask stuff: 65 | instance/ 66 | .webassets-cache 67 | 68 | # Scrapy stuff: 69 | .scrapy 70 | 71 | # Sphinx documentation 72 | docs/_build/ 73 | 74 | # PyBuilder 75 | .pybuilder/ 76 | target/ 77 | 78 | # Jupyter Notebook 79 | .ipynb_checkpoints 80 | 81 | # IPython 82 | profile_default/ 83 | ipython_config.py 84 | 85 | # pyenv 86 | # For a library or package, you might want to ignore these files since the code is 87 | # intended to run in multiple environments; otherwise, check them in: 88 | # .python-version 89 | 90 | # pipenv 91 | # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. 92 | # However, in case of collaboration, if having platform-specific dependencies or dependencies 93 | # having no cross-platform support, pipenv may install dependencies that don't work, or not 94 | # install all needed dependencies. 95 | #Pipfile.lock 96 | 97 | # poetry 98 | # Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control. 99 | # This is especially recommended for binary packages to ensure reproducibility, and is more 100 | # commonly ignored for libraries. 101 | # https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control 102 | #poetry.lock 103 | 104 | # PEP 582; used by e.g. 
github.com/David-OConnor/pyflow 105 | __pypackages__/ 106 | 107 | # Celery stuff 108 | celerybeat-schedule 109 | celerybeat.pid 110 | 111 | # SageMath parsed files 112 | *.sage.py 113 | 114 | # Environments 115 | .env 116 | .venv 117 | env/ 118 | venv/ 119 | ENV/ 120 | env.bak/ 121 | venv.bak/ 122 | 123 | # Spyder project settings 124 | .spyderproject 125 | .spyproject 126 | 127 | # Rope project settings 128 | .ropeproject 129 | 130 | # mkdocs documentation 131 | /site 132 | 133 | # mypy 134 | .mypy_cache/ 135 | .dmypy.json 136 | dmypy.json 137 | 138 | # Pyre type checker 139 | .pyre/ 140 | 141 | # pytype static type analyzer 142 | .pytype/ 143 | 144 | # Cython debug symbols 145 | cython_debug/ 146 | 147 | # data 148 | data/ 149 | 150 | # test 151 | test.py 152 | 153 | # querys 154 | querys.txt 155 | 156 | # scripts 157 | scripts/stat.py 158 | scripts/stat1.py 159 | 160 | # PyCharm 161 | # JetBrains specific template is maintainted in a separate JetBrains.gitignore that can 162 | # be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore 163 | # and can be added to the global gitignore or merged into this file. For a more nuclear 164 | # option (not recommended) you can uncomment the following to ignore the entire idea folder. 165 | #.idea/ -------------------------------------------------------------------------------- /LICENSE.txt: -------------------------------------------------------------------------------- 1 | Attribution-NonCommercial-ShareAlike 4.0 International 2 | 3 | ======================================================================= 4 | 5 | Creative Commons Corporation ("Creative Commons") is not a law firm and 6 | does not provide legal services or legal advice. Distribution of 7 | Creative Commons public licenses does not create a lawyer-client or 8 | other relationship. Creative Commons makes its licenses and related 9 | information available on an "as-is" basis. 
Creative Commons gives no 10 | warranties regarding its licenses, any material licensed under their 11 | terms and conditions, or any related information. Creative Commons 12 | disclaims all liability for damages resulting from their use to the 13 | fullest extent possible. 14 | 15 | Using Creative Commons Public Licenses 16 | 17 | Creative Commons public licenses provide a standard set of terms and 18 | conditions that creators and other rights holders may use to share 19 | original works of authorship and other material subject to copyright 20 | and certain other rights specified in the public license below. The 21 | following considerations are for informational purposes only, are not 22 | exhaustive, and do not form part of our licenses. 23 | 24 | Considerations for licensors: Our public licenses are 25 | intended for use by those authorized to give the public 26 | permission to use material in ways otherwise restricted by 27 | copyright and certain other rights. Our licenses are 28 | irrevocable. Licensors should read and understand the terms 29 | and conditions of the license they choose before applying it. 30 | Licensors should also secure all rights necessary before 31 | applying our licenses so that the public can reuse the 32 | material as expected. Licensors should clearly mark any 33 | material not subject to the license. This includes other CC- 34 | licensed material, or material used under an exception or 35 | limitation to copyright. More considerations for licensors: 36 | wiki.creativecommons.org/Considerations_for_licensors 37 | 38 | Considerations for the public: By using one of our public 39 | licenses, a licensor grants the public permission to use the 40 | licensed material under specified terms and conditions. If 41 | the licensor's permission is not necessary for any reason--for 42 | example, because of any applicable exception or limitation to 43 | copyright--then that use is not regulated by the license. 
Our 44 | licenses grant only permissions under copyright and certain 45 | other rights that a licensor has authority to grant. Use of 46 | the licensed material may still be restricted for other 47 | reasons, including because others have copyright or other 48 | rights in the material. A licensor may make special requests, 49 | such as asking that all changes be marked or described. 50 | Although not required by our licenses, you are encouraged to 51 | respect those requests where reasonable. More considerations 52 | for the public: 53 | wiki.creativecommons.org/Considerations_for_licensees 54 | 55 | ======================================================================= 56 | 57 | Creative Commons Attribution-NonCommercial-ShareAlike 4.0 International 58 | Public License 59 | 60 | By exercising the Licensed Rights (defined below), You accept and agree 61 | to be bound by the terms and conditions of this Creative Commons 62 | Attribution-NonCommercial-ShareAlike 4.0 International Public License 63 | ("Public License"). To the extent this Public License may be 64 | interpreted as a contract, You are granted the Licensed Rights in 65 | consideration of Your acceptance of these terms and conditions, and the 66 | Licensor grants You such rights in consideration of benefits the 67 | Licensor receives from making the Licensed Material available under 68 | these terms and conditions. 69 | 70 | 71 | Section 1 -- Definitions. 72 | 73 | a. Adapted Material means material subject to Copyright and Similar 74 | Rights that is derived from or based upon the Licensed Material 75 | and in which the Licensed Material is translated, altered, 76 | arranged, transformed, or otherwise modified in a manner requiring 77 | permission under the Copyright and Similar Rights held by the 78 | Licensor. 
For purposes of this Public License, where the Licensed 79 | Material is a musical work, performance, or sound recording, 80 | Adapted Material is always produced where the Licensed Material is 81 | synched in timed relation with a moving image. 82 | 83 | b. Adapter's License means the license You apply to Your Copyright 84 | and Similar Rights in Your contributions to Adapted Material in 85 | accordance with the terms and conditions of this Public License. 86 | 87 | c. BY-NC-SA Compatible License means a license listed at 88 | creativecommons.org/compatiblelicenses, approved by Creative 89 | Commons as essentially the equivalent of this Public License. 90 | 91 | d. Copyright and Similar Rights means copyright and/or similar rights 92 | closely related to copyright including, without limitation, 93 | performance, broadcast, sound recording, and Sui Generis Database 94 | Rights, without regard to how the rights are labeled or 95 | categorized. For purposes of this Public License, the rights 96 | specified in Section 2(b)(1)-(2) are not Copyright and Similar 97 | Rights. 98 | 99 | e. Effective Technological Measures means those measures that, in the 100 | absence of proper authority, may not be circumvented under laws 101 | fulfilling obligations under Article 11 of the WIPO Copyright 102 | Treaty adopted on December 20, 1996, and/or similar international 103 | agreements. 104 | 105 | f. Exceptions and Limitations means fair use, fair dealing, and/or 106 | any other exception or limitation to Copyright and Similar Rights 107 | that applies to Your use of the Licensed Material. 108 | 109 | g. License Elements means the license attributes listed in the name 110 | of a Creative Commons Public License. The License Elements of this 111 | Public License are Attribution, NonCommercial, and ShareAlike. 112 | 113 | h. Licensed Material means the artistic or literary work, database, 114 | or other material to which the Licensor applied this Public 115 | License. 116 | 117 | i. 
Licensed Rights means the rights granted to You subject to the 118 | terms and conditions of this Public License, which are limited to 119 | all Copyright and Similar Rights that apply to Your use of the 120 | Licensed Material and that the Licensor has authority to license. 121 | 122 | j. Licensor means the individual(s) or entity(ies) granting rights 123 | under this Public License. 124 | 125 | k. NonCommercial means not primarily intended for or directed towards 126 | commercial advantage or monetary compensation. For purposes of 127 | this Public License, the exchange of the Licensed Material for 128 | other material subject to Copyright and Similar Rights by digital 129 | file-sharing or similar means is NonCommercial provided there is 130 | no payment of monetary compensation in connection with the 131 | exchange. 132 | 133 | l. Share means to provide material to the public by any means or 134 | process that requires permission under the Licensed Rights, such 135 | as reproduction, public display, public performance, distribution, 136 | dissemination, communication, or importation, and to make material 137 | available to the public including in ways that members of the 138 | public may access the material from a place and at a time 139 | individually chosen by them. 140 | 141 | m. Sui Generis Database Rights means rights other than copyright 142 | resulting from Directive 96/9/EC of the European Parliament and of 143 | the Council of 11 March 1996 on the legal protection of databases, 144 | as amended and/or succeeded, as well as other essentially 145 | equivalent rights anywhere in the world. 146 | 147 | n. You means the individual or entity exercising the Licensed Rights 148 | under this Public License. Your has a corresponding meaning. 149 | 150 | 151 | Section 2 -- Scope. 152 | 153 | a. License grant. 154 | 155 | 1. 
Subject to the terms and conditions of this Public License, 156 | the Licensor hereby grants You a worldwide, royalty-free, 157 | non-sublicensable, non-exclusive, irrevocable license to 158 | exercise the Licensed Rights in the Licensed Material to: 159 | 160 | a. reproduce and Share the Licensed Material, in whole or 161 | in part, for NonCommercial purposes only; and 162 | 163 | b. produce, reproduce, and Share Adapted Material for 164 | NonCommercial purposes only. 165 | 166 | 2. Exceptions and Limitations. For the avoidance of doubt, where 167 | Exceptions and Limitations apply to Your use, this Public 168 | License does not apply, and You do not need to comply with 169 | its terms and conditions. 170 | 171 | 3. Term. The term of this Public License is specified in Section 172 | 6(a). 173 | 174 | 4. Media and formats; technical modifications allowed. The 175 | Licensor authorizes You to exercise the Licensed Rights in 176 | all media and formats whether now known or hereafter created, 177 | and to make technical modifications necessary to do so. The 178 | Licensor waives and/or agrees not to assert any right or 179 | authority to forbid You from making technical modifications 180 | necessary to exercise the Licensed Rights, including 181 | technical modifications necessary to circumvent Effective 182 | Technological Measures. For purposes of this Public License, 183 | simply making modifications authorized by this Section 2(a) 184 | (4) never produces Adapted Material. 185 | 186 | 5. Downstream recipients. 187 | 188 | a. Offer from the Licensor -- Licensed Material. Every 189 | recipient of the Licensed Material automatically 190 | receives an offer from the Licensor to exercise the 191 | Licensed Rights under the terms and conditions of this 192 | Public License. 193 | 194 | b. Additional offer from the Licensor -- Adapted Material. 
195 | Every recipient of Adapted Material from You 196 | automatically receives an offer from the Licensor to 197 | exercise the Licensed Rights in the Adapted Material 198 | under the conditions of the Adapter's License You apply. 199 | 200 | c. No downstream restrictions. You may not offer or impose 201 | any additional or different terms or conditions on, or 202 | apply any Effective Technological Measures to, the 203 | Licensed Material if doing so restricts exercise of the 204 | Licensed Rights by any recipient of the Licensed 205 | Material. 206 | 207 | 6. No endorsement. Nothing in this Public License constitutes or 208 | may be construed as permission to assert or imply that You 209 | are, or that Your use of the Licensed Material is, connected 210 | with, or sponsored, endorsed, or granted official status by, 211 | the Licensor or others designated to receive attribution as 212 | provided in Section 3(a)(1)(A)(i). 213 | 214 | b. Other rights. 215 | 216 | 1. Moral rights, such as the right of integrity, are not 217 | licensed under this Public License, nor are publicity, 218 | privacy, and/or other similar personality rights; however, to 219 | the extent possible, the Licensor waives and/or agrees not to 220 | assert any such rights held by the Licensor to the limited 221 | extent necessary to allow You to exercise the Licensed 222 | Rights, but not otherwise. 223 | 224 | 2. Patent and trademark rights are not licensed under this 225 | Public License. 226 | 227 | 3. To the extent possible, the Licensor waives any right to 228 | collect royalties from You for the exercise of the Licensed 229 | Rights, whether directly or through a collecting society 230 | under any voluntary or waivable statutory or compulsory 231 | licensing scheme. In all other cases the Licensor expressly 232 | reserves any right to collect such royalties, including when 233 | the Licensed Material is used other than for NonCommercial 234 | purposes. 
235 | 236 | 237 | Section 3 -- License Conditions. 238 | 239 | Your exercise of the Licensed Rights is expressly made subject to the 240 | following conditions. 241 | 242 | a. Attribution. 243 | 244 | 1. If You Share the Licensed Material (including in modified 245 | form), You must: 246 | 247 | a. retain the following if it is supplied by the Licensor 248 | with the Licensed Material: 249 | 250 | i. identification of the creator(s) of the Licensed 251 | Material and any others designated to receive 252 | attribution, in any reasonable manner requested by 253 | the Licensor (including by pseudonym if 254 | designated); 255 | 256 | ii. a copyright notice; 257 | 258 | iii. a notice that refers to this Public License; 259 | 260 | iv. a notice that refers to the disclaimer of 261 | warranties; 262 | 263 | v. a URI or hyperlink to the Licensed Material to the 264 | extent reasonably practicable; 265 | 266 | b. indicate if You modified the Licensed Material and 267 | retain an indication of any previous modifications; and 268 | 269 | c. indicate the Licensed Material is licensed under this 270 | Public License, and include the text of, or the URI or 271 | hyperlink to, this Public License. 272 | 273 | 2. You may satisfy the conditions in Section 3(a)(1) in any 274 | reasonable manner based on the medium, means, and context in 275 | which You Share the Licensed Material. For example, it may be 276 | reasonable to satisfy the conditions by providing a URI or 277 | hyperlink to a resource that includes the required 278 | information. 279 | 3. If requested by the Licensor, You must remove any of the 280 | information required by Section 3(a)(1)(A) to the extent 281 | reasonably practicable. 282 | 283 | b. ShareAlike. 284 | 285 | In addition to the conditions in Section 3(a), if You Share 286 | Adapted Material You produce, the following conditions also apply. 287 | 288 | 1. 
The Adapter's License You apply must be a Creative Commons 289 | license with the same License Elements, this version or 290 | later, or a BY-NC-SA Compatible License. 291 | 292 | 2. You must include the text of, or the URI or hyperlink to, the 293 | Adapter's License You apply. You may satisfy this condition 294 | in any reasonable manner based on the medium, means, and 295 | context in which You Share Adapted Material. 296 | 297 | 3. You may not offer or impose any additional or different terms 298 | or conditions on, or apply any Effective Technological 299 | Measures to, Adapted Material that restrict exercise of the 300 | rights granted under the Adapter's License You apply. 301 | 302 | 303 | Section 4 -- Sui Generis Database Rights. 304 | 305 | Where the Licensed Rights include Sui Generis Database Rights that 306 | apply to Your use of the Licensed Material: 307 | 308 | a. for the avoidance of doubt, Section 2(a)(1) grants You the right 309 | to extract, reuse, reproduce, and Share all or a substantial 310 | portion of the contents of the database for NonCommercial purposes 311 | only; 312 | 313 | b. if You include all or a substantial portion of the database 314 | contents in a database in which You have Sui Generis Database 315 | Rights, then the database in which You have Sui Generis Database 316 | Rights (but not its individual contents) is Adapted Material, 317 | including for purposes of Section 3(b); and 318 | 319 | c. You must comply with the conditions in Section 3(a) if You Share 320 | all or a substantial portion of the contents of the database. 321 | 322 | For the avoidance of doubt, this Section 4 supplements and does not 323 | replace Your obligations under this Public License where the Licensed 324 | Rights include other Copyright and Similar Rights. 325 | 326 | 327 | Section 5 -- Disclaimer of Warranties and Limitation of Liability. 328 | 329 | a. 
UNLESS OTHERWISE SEPARATELY UNDERTAKEN BY THE LICENSOR, TO THE 330 | EXTENT POSSIBLE, THE LICENSOR OFFERS THE LICENSED MATERIAL AS-IS 331 | AND AS-AVAILABLE, AND MAKES NO REPRESENTATIONS OR WARRANTIES OF 332 | ANY KIND CONCERNING THE LICENSED MATERIAL, WHETHER EXPRESS, 333 | IMPLIED, STATUTORY, OR OTHER. THIS INCLUDES, WITHOUT LIMITATION, 334 | WARRANTIES OF TITLE, MERCHANTABILITY, FITNESS FOR A PARTICULAR 335 | PURPOSE, NON-INFRINGEMENT, ABSENCE OF LATENT OR OTHER DEFECTS, 336 | ACCURACY, OR THE PRESENCE OR ABSENCE OF ERRORS, WHETHER OR NOT 337 | KNOWN OR DISCOVERABLE. WHERE DISCLAIMERS OF WARRANTIES ARE NOT 338 | ALLOWED IN FULL OR IN PART, THIS DISCLAIMER MAY NOT APPLY TO YOU. 339 | 340 | b. TO THE EXTENT POSSIBLE, IN NO EVENT WILL THE LICENSOR BE LIABLE 341 | TO YOU ON ANY LEGAL THEORY (INCLUDING, WITHOUT LIMITATION, 342 | NEGLIGENCE) OR OTHERWISE FOR ANY DIRECT, SPECIAL, INDIRECT, 343 | INCIDENTAL, CONSEQUENTIAL, PUNITIVE, EXEMPLARY, OR OTHER LOSSES, 344 | COSTS, EXPENSES, OR DAMAGES ARISING OUT OF THIS PUBLIC LICENSE OR 345 | USE OF THE LICENSED MATERIAL, EVEN IF THE LICENSOR HAS BEEN 346 | ADVISED OF THE POSSIBILITY OF SUCH LOSSES, COSTS, EXPENSES, OR 347 | DAMAGES. WHERE A LIMITATION OF LIABILITY IS NOT ALLOWED IN FULL OR 348 | IN PART, THIS LIMITATION MAY NOT APPLY TO YOU. 349 | 350 | c. The disclaimer of warranties and limitation of liability provided 351 | above shall be interpreted in a manner that, to the extent 352 | possible, most closely approximates an absolute disclaimer and 353 | waiver of all liability. 354 | 355 | 356 | Section 6 -- Term and Termination. 357 | 358 | a. This Public License applies for the term of the Copyright and 359 | Similar Rights licensed here. However, if You fail to comply with 360 | this Public License, then Your rights under this Public License 361 | terminate automatically. 362 | 363 | b. Where Your right to use the Licensed Material has terminated under 364 | Section 6(a), it reinstates: 365 | 366 | 1. 
automatically as of the date the violation is cured, provided 367 | it is cured within 30 days of Your discovery of the 368 | violation; or 369 | 370 | 2. upon express reinstatement by the Licensor. 371 | 372 | For the avoidance of doubt, this Section 6(b) does not affect any 373 | right the Licensor may have to seek remedies for Your violations 374 | of this Public License. 375 | 376 | c. For the avoidance of doubt, the Licensor may also offer the 377 | Licensed Material under separate terms or conditions or stop 378 | distributing the Licensed Material at any time; however, doing so 379 | will not terminate this Public License. 380 | 381 | d. Sections 1, 5, 6, 7, and 8 survive termination of this Public 382 | License. 383 | 384 | 385 | Section 7 -- Other Terms and Conditions. 386 | 387 | a. The Licensor shall not be bound by any additional or different 388 | terms or conditions communicated by You unless expressly agreed. 389 | 390 | b. Any arrangements, understandings, or agreements regarding the 391 | Licensed Material not stated herein are separate from and 392 | independent of the terms and conditions of this Public License. 393 | 394 | 395 | Section 8 -- Interpretation. 396 | 397 | a. For the avoidance of doubt, this Public License does not, and 398 | shall not be interpreted to, reduce, limit, restrict, or impose 399 | conditions on any use of the Licensed Material that could lawfully 400 | be made without permission under this Public License. 401 | 402 | b. To the extent possible, if any provision of this Public License is 403 | deemed unenforceable, it shall be automatically reformed to the 404 | minimum extent necessary to make it enforceable. If the provision 405 | cannot be reformed, it shall be severed from this Public License 406 | without affecting the enforceability of the remaining terms and 407 | conditions. 408 | 409 | c. 
No term or condition of this Public License will be waived and no 410 | failure to comply consented to unless expressly agreed to by the 411 | Licensor. 412 | 413 | d. Nothing in this Public License constitutes or may be interpreted 414 | as a limitation upon, or waiver of, any privileges and immunities 415 | that apply to the Licensor or You, including from the legal 416 | processes of any jurisdiction or authority. 417 | 418 | ======================================================================= 419 | 420 | Creative Commons is not a party to its public 421 | licenses. Notwithstanding, Creative Commons may elect to apply one of 422 | its public licenses to material it publishes and in those instances 423 | will be considered the “Licensor.” The text of the Creative Commons 424 | public licenses is dedicated to the public domain under the CC0 Public 425 | Domain Dedication. Except for the limited purpose of indicating that 426 | material is shared under a Creative Commons public license or as 427 | otherwise permitted by the Creative Commons policies published at 428 | creativecommons.org/policies, Creative Commons does not authorize the 429 | use of the trademark "Creative Commons" or any other trademark or logo 430 | of Creative Commons without its prior written consent including, 431 | without limitation, in connection with any unauthorized modifications 432 | to any of its public licenses or any other arrangements, 433 | understandings, or agreements concerning use of licensed material. For 434 | the avoidance of doubt, this paragraph does not form part of the 435 | public licenses. 436 | 437 | Creative Commons may be contacted at creativecommons.org. -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 |
4 |
7 |
8 |
9 |
10 |
11 |
12 | 📚 Dataset | 📚 Benchmark | 🤗 Models | 📑 Paper
13 |
14 |
15 | KwaiAgents is a series of Agent-related works open-sourced by the [KwaiKEG](https://github.com/KwaiKEG) from [Kuaishou Technology](https://www.kuaishou.com/en). The open-sourced content includes:
16 |
17 | 1. **KAgentSys-Lite**: a lite version of the KAgentSys in the paper. While retaining some of the original system's functionality, KAgentSys-Lite has certain differences and limitations when compared to its full-featured counterpart, such as: (1) a more limited set of tools; (2) a lack of memory mechanisms; (3) slightly reduced performance capabilities; and (4) a different codebase, as it evolves from open-source projects like BabyAGI and Auto-GPT. Despite these modifications, KAgentSys-Lite still delivers performance comparable to the numerous open-source Agent systems available.
18 | 2. **KAgentLMs**: a series of large language models with agent capabilities such as planning, reflection, and tool-use, acquired through the Meta-agent tuning proposed in the paper.
19 | 3. **KAgentInstruct**: over 200k Agent-related instruction-tuning data entries (partially human-edited) proposed in the paper.
20 | 4. **KAgentBench**: over 3,000 human-edited, automated evaluation data entries for testing Agent capabilities, with evaluation dimensions including planning, tool-use, reflection, concluding, and profiling.
21 |
22 |
23 |
Type | 26 |Models | 27 |Training Data | 28 |Benchmark Data | 29 |
Qwen | 32 |
33 | Qwen-7B-MAT 34 | Qwen-14B-MAT 35 | Qwen-7B-MAT-cpp 36 | Qwen1.5-14B-MAT 37 | |
38 | KAgentInstruct | 39 |KAgentBench | 40 |
Baichuan | 43 |Baichuan2-13B-MAT | 44 |
52 |
53 |
54 |
55 |
56 |
57 |
58 |
59 |
60 | 61 | ## News 62 | * 2024.4.19 - Qwen1.5-14B-MAT model [[link]](https://huggingface.co/kwaikeg/kagentlms_qwen1.5_14b_mat) released. 63 | * 2024.4.9 - Benchmark results have been refreshed. 64 | * 2024.1.29 - Qwen-14B-MAT model [[link]](https://huggingface.co/kwaikeg/kagentlms_qwen_14b_mat) released. 65 | * 2024.1.5 - Training data [[link]](https://huggingface.co/datasets/kwaikeg/KAgentInstruct) released. 66 | * 2023.12.27 - 🔥🔥🔥 KwaiAgents have been reported on many sites. [[机器之心]](https://mp.weixin.qq.com/s/QhZIFL1GHH90z98gnk194g) [[Medium]](https://medium.com/@myscarletpan/can-7b-models-now-master-ai-agents-a-look-at-kwais-recent-llm-open-source-release-8b9e84647412) [[InfoQ]](https://www.infoq.cn/article/xHGJwG3b8hXSdaP4m6r0), etc. 67 | * 2023.12.13 - The benchmark and evaluation code [[link]](https://huggingface.co/datasets/kwaikeg/KAgentBench) released. 68 | * 2023.12.08 - Technical report [[link]](https://arxiv.org/abs/2312.04889) released. 69 | * 2023.11.17 - Initial release. 70 | 71 | ## Evaluation 72 | 1. 
Benchmark Results 73 | 74 | | | Scale | Planning | Tool-use | Reflection | Concluding | Profile | Overall Score | 75 | |----------------|-------|----------|----------|------------|------------|---------|---------------| 76 | | GPT-3.5-turbo | - | 18.55 | 26.26 | 8.06 | 37.26 | 35.42 | 25.63 | 77 | | Llama2 | 13B | 0.15 | 0.44 | 0.14 | 16.60 | 17.73 | 5.30 | 78 | | ChatGLM3 | 6B | 7.87 | 11.84 | 7.52 | 30.01 | 30.14 | 15.88 | 79 | | Qwen | 7B | 13.34 | 18.00 | 7.91 | 36.24 | 34.99 | 21.17 | 80 | | Baichuan2 | 13B | 6.70 | 16.10 | 6.76 | 24.97 | 19.08 | 14.89 | 81 | | ToolLlama | 7B | 0.20 | 4.83 | 1.06 | 15.62 | 10.66 | 6.04 | 82 | | AgentLM | 13B | 0.17 | 0.15 | 0.05 | 16.30 | 15.22 | 4.88 | 83 | | Qwen-MAT | 7B | 31.64 | 43.30 | 33.34 | 44.85 | 44.78 | 39.85 | 84 | | Baichuan2-MAT | 13B | 37.27 | 52.97 | 37.00 | 48.01 | 41.83 | 45.34 | 85 | | Qwen-MAT | 14B | 43.17 | 63.78 | 32.14 | 45.47 | 45.22 | 49.94 | 86 | | Qwen1.5-MAT | 14B | 42.42 | 64.62 | 30.58 | 46.51 | 45.95 | 50.18 | 87 | 88 | 89 | 2. Human evaluation. Each result cell shows the pass rate (\%) and the average score (in parentheses) 90 | 91 | | | Scale | NoAgent | ReACT | Auto-GPT | KAgentSys | 92 | |-----------------|---------|-----------------|----------------|-----------------|-----------------| 93 | | GPT-4 | - | 57.21% (3.42) | 68.66% (3.88) | 79.60% (4.27) | 83.58% (4.47) | 94 | | GPT-3.5-turbo | - | 47.26% (3.08) | 54.23% (3.33) | 61.74% (3.53) | 64.18% (3.69) | 95 | | Qwen | 7B | 52.74% (3.23) | 51.74% (3.20) | 50.25% (3.11) | 54.23% (3.27) | 96 | | Baichuan2 | 13B | 54.23% (3.31) | 55.72% (3.36) | 57.21% (3.37) | 58.71% (3.54) | 97 | | Qwen-MAT | 7B | - | 58.71% (3.53) | 65.67% (3.77) | 67.66% (3.87) | 98 | | Baichuan2-MAT | 13B | - | 61.19% (3.60) | 66.67% (3.86) | 74.13% (4.11) | 99 | 100 | 101 | ## User Guide 102 | 103 | ### Prebuild environment 104 | Install miniconda for build environment first. 
Then create build env first: 105 | ```bash 106 | conda create -n kagent python=3.10 107 | conda activate kagent 108 | pip install -r requirements.txt 109 | ``` 110 | 111 | ### Using AgentLMs 112 | #### Serving by [vLLM](https://github.com/vllm-project/vllm) (GPU) 113 | We recommend using [vLLM](https://github.com/vllm-project/vllm) and [FastChat](https://github.com/lm-sys/FastChat) to deploy the model inference service. First, you need to install the corresponding packages (for detailed usage, please refer to the documentation of the two projects): 114 | 1. For Qwen-7B-MAT, install the corresponding packages with the following commands 115 | ```bash 116 | pip install vllm 117 | pip install "fschat[model_worker,webui]" 118 | ``` 119 | 2. For Baichuan-13B-MAT, install the corresponding packages with the following commands 120 | ```bash 121 | pip install "fschat[model_worker,webui]" 122 | pip install vllm==0.2.0 123 | pip install transformers==4.33.2 124 | ``` 125 | 126 | To deploy KAgentLMs, you first need to start the controller in one terminal. 127 | ```bash 128 | python -m fastchat.serve.controller 129 | ``` 130 | Secondly, you should use the following command in another terminal for single-gpu inference service deployment: 131 | ```bash 132 | python -m fastchat.serve.vllm_worker --model-path $model_path --trust-remote-code 133 | ``` 134 | Where `$model_path` is the local path of the model downloaded. If the GPU does not support Bfloat16, you can add `--dtype half` to the command line. 135 | 136 | Thirdly, start the REST API server in the third terminal. 137 | ```bash 138 | python -m fastchat.serve.openai_api_server --host localhost --port 8888 139 | ``` 140 | 141 | Finally, you can use the curl command to invoke the model same as the OpenAI calling format. 
Here's an example: 142 | ```bash 143 | curl http://localhost:8888/v1/chat/completions \ 144 | -H "Content-Type: application/json" \ 145 | -d '{"model": "kagentlms_qwen_7b_mat", "messages": [{"role": "user", "content": "Who is Andy Lau"}]}' 146 | ``` 147 | Here, change `kagentlms_qwen_7b_mat` to the model you deployed. 148 | 149 | #### Serving by [Lamma.cpp](https://github.com/ggerganov/llama.cpp) (CPU) 150 | llama-cpp-python offers a web server which aims to act as a drop-in replacement for the OpenAI API. This allows you to use llama.cpp compatible models with any OpenAI compatible client (language libraries, services, etc). The converted model can be found in [kwaikeg/kagentlms_qwen_7b_mat_gguf](https://huggingface.co/kwaikeg/kagentlms_qwen_7b_mat_gguf). 151 | 152 | To install the server package and get started: 153 | ```bash 154 | pip install "llama-cpp-python[server]" 155 | python3 -m llama_cpp.server --model kagentlms_qwen_7b_mat_gguf/ggml-model-q4_0.gguf --chat_format chatml --port 8888 156 | ``` 157 | 158 | Finally, you can use the curl command to invoke the model same as the OpenAI calling format. Here's an example: 159 | ```bash 160 | curl http://localhost:8888/v1/chat/completions \ 161 | -H "Content-Type: application/json" \ 162 | -d '{"messages": [{"role": "user", "content": "Who is Andy Lau"}]}' 163 | ``` 164 | 165 | ### Using KAgentSys-Lite 166 | Download and install the KwaiAgents, recommended Python>=3.10 167 | ```bash 168 | git clone git@github.com:KwaiKEG/KwaiAgents.git 169 | cd KwaiAgents 170 | python setup.py develop 171 | ``` 172 | 173 | 1. **ChatGPT usage** 174 | Declare some environment variables 175 | ``` 176 | export OPENAI_API_KEY=sk-xxxxx 177 | export WEATHER_API_KEY=xxxxxx 178 | ``` 179 | 180 | The WEATHER_API_KEY is not mandatory, but you need to configure it when asking weather-related questions. You can obtain the API key from [this website](https://www.weatherapi.com/) (Same for local model usage). 
181 | 182 | ```bash 183 | kagentsys --query="Who is Andy Lau's wife?" --llm_name="gpt-3.5-turbo" --lang="en" 184 | ``` 185 | 186 | 2. **Local model usage** 187 | > To use a local model, you need to deploy the corresponding model service as described in the previous chapter 188 | ```bash 189 | kagentsys --query="Who is Andy Lau's wife?" --llm_name="kagentlms_qwen_7b_mat" \ 190 | --use_local_llm --local_llm_host="localhost" --local_llm_port=8888 --lang="en" 191 | ``` 192 | 193 | 194 | Full command arguments: 195 | 196 | ``` 197 | options: 198 | -h, --help show this help message and exit 199 | --id ID ID of this conversation 200 | --query QUERY User query 201 | --history HISTORY History of conversation 202 | --llm_name LLM_NAME the name of llm 203 | --use_local_llm Whether to use local llm 204 | --local_llm_host LOCAL_LLM_HOST 205 | The host of local llm service 206 | --local_llm_port LOCAL_LLM_PORT 207 | The port of local llm service 208 | --tool_names TOOL_NAMES 209 | the name of llm 210 | --max_iter_num MAX_ITER_NUM 211 | the number of iteration of agents 212 | --agent_name AGENT_NAME 213 | The agent name 214 | --agent_bio AGENT_BIO 215 | The agent bio, a short description 216 | --agent_instructions AGENT_INSTRUCTIONS 217 | The instructions of how agent thinking, acting, or talking 218 | --external_knowledge EXTERNAL_KNOWLEDGE 219 | The link of external knowledge 220 | --lang {en,zh} The language of the overall system 221 | --max_tokens_num Maximum length of model input 222 | ``` 223 | 224 | **Note**: 225 | 1. If you need to use the `browse_website` tool, you need to configure the [chromedriver](https://chromedriver.chromium.org/getting-started) on your server. 226 | 2. If the search fails multiple times, it may be because the network cannot access duckduckgo_search. You can solve this by setting the `http_proxy`. 
227 | 228 | #### Using Custom tools 229 | Custom tools usage can be found in examples/custom_tool_example.py 230 | 231 | ### Using KAgentBench Evaluation 232 | We only need two lines to evaluate the agent capabilities like: 233 | ```bash 234 | cd benchmark 235 | python infer_qwen.py qwen_benchmark_res.jsonl 236 | python benchmark_eval.py ./benchmark_eval.jsonl ./qwen_benchmark_res.jsonl 237 | ``` 238 | The above command will give the results like 239 | ``` 240 | plan : 31.64, tooluse : 43.30, reflextion : 33.34, conclusion : 44.85, profile : 44.78, overall : 39.85 241 | ``` 242 | 243 | Please refer to benchmark/ for more details. 244 | 245 | ## Citation 246 | ``` 247 | @article{pan2023kwaiagents, 248 | author = {Haojie Pan and 249 | Zepeng Zhai and 250 | Hao Yuan and 251 | Yaojia Lv and 252 | Ruiji Fu and 253 | Ming Liu and 254 | Zhongyuan Wang and 255 | Bing Qin 256 | }, 257 | title = {KwaiAgents: Generalized Information-seeking Agent System with Large Language Models}, 258 | journal = {CoRR}, 259 | volume = {abs/2312.04889}, 260 | year = {2023} 261 | } 262 | ``` 263 | -------------------------------------------------------------------------------- /README_JA.md: -------------------------------------------------------------------------------- 1 |
4 |
7 |
8 |
9 |
10 |
11 |
12 | 📚 データセット | 📚 ベンチマーク | 🤗 モデル | 📑 論文
13 |
14 |
15 | KwaiAgents は、[Kuaishou Technology](https://www.kuaishou.com/en) の [KwaiKEG](https://github.com/KwaiKEG) によってオープンソース化されたエージェント関連の作品シリーズです。オープンソース化されたコンテンツには以下が含まれます:
16 |
17 | 1. **KAgentSys-Lite**: KAgentSys-Lite は、KAgentSys のライトバージョンである。KAgentSys-Lite は、元のシステムの機能の一部を保持していますが、フル機能の対応物と比較すると、以下のような特定の相違点と制限があります: (1)より限定されたツールセット、(2)メモリメカニズムの欠如、(3)若干低下したパフォーマンス能力、(4)BabyAGI や Auto-GPT のようなオープンソースプロジェクトから進化した異なるコードベース。これらの変更にもかかわらず、KAgentSys-Lite は、利用可能な数多くのオープンソースエージェントシステムの中で同等のパフォーマンスを提供します。
18 | 2. **KAgentLMs**: この論文で提案されているメタエージェント・チューニングによって獲得された、プランニング、リフレクション、ツール使用などのエージェント能力を持つ一連の大規模言語モデル。
19 | 3. **KAgentInstruct**: 論文で提案された200k以上のエージェント関連命令の微調整データ(部分的に人間が編集したもの)。
20 | 4. **KAgentBench**: Agent の能力をテストするための、3,000を超える人間による自動化された評価データ。評価項目には、計画、ツールの使用、考察、結論、プロファイリングが含まれる。
21 |
22 |
タイプ | 25 |モデル | 26 |訓練データ | 27 |ベンチマークデータ | 28 |
Qwen | 31 |
32 | Qwen-7B-MAT 33 | Qwen-14B-MAT 34 | Qwen-7B-MAT-cpp 35 | Qwen1.5-14B-MAT 36 | |
37 | KAgentInstruct | 38 |KAgentBench | 39 |
Baichuan | 42 |Baichuan2-13B-MAT | 43 |
50 |
51 |
52 |
53 |
54 |
55 |
56 |
57 |
58 | 59 | ## ニュース 60 | * 2024年4月19日 - Qwen1.5-14B-MATモデル [[リンク]](https://huggingface.co/kwaikeg/kagentlms_qwen1.5_14b_mat) がリリースされました。 61 | * 2024年4月9日 - ベンチマーク結果が更新されました。 62 | * 2024.1.29 - Qwen-14B-MAT [[リンク]](https://huggingface.co/kwaikeg/kagentlms_qwen_14b_mat) をリリース. 63 | * 2023.1.5 - トレーニングデータ[[リンク]](https://huggingface.co/datasets/kwaikeg/KAgentInstruct)をリリース。 64 | * 2023.12.27 - 🔥🔥🔥 KwaiAgents は多くのサイトで報告されている。[[机器之心]](https://mp.weixin.qq.com/s/QhZIFL1GHH90z98gnk194g) [[Medium]](https://medium.com/@myscarletpan/can-7b-models-now-master-ai-agents-a-look-at-kwais-recent-llm-open-source-release-8b9e84647412) [[InfoQ]](https://www.infoq.cn/article/xHGJwG3b8hXSdaP4m6r0) など。 65 | * 2023.12.13 - 公開されたベンチマークと評価コード[[リンク]](https://huggingface.co/datasets/kwaikeg/KAgentBench)をリリース 66 | * 2023.12.08 - テクニカルレポート[[リンク]](https://arxiv.org/abs/2312.04889)をリリース 67 | * 2023.11.17 - 初回リリース 68 | 69 | ## 評価 70 | 1. ベンチマーク結果 71 | 72 | | | Scale | Planning | Tool-use | Reflection | Concluding | Profile | Overall Score | 73 | |----------------|-------|----------|----------|------------|------------|---------|---------------| 74 | | GPT-3.5-turbo | - | 18.55 | 26.26 | 8.06 | 37.26 | 35.42 | 25.63 | 75 | | Llama2 | 13B | 0.15 | 0.44 | 0.14 | 16.60 | 17.73 | 5.30 | 76 | | ChatGLM3 | 6B | 7.87 | 11.84 | 7.52 | 30.01 | 30.14 | 15.88 | 77 | | Qwen | 7B | 13.34 | 18.00 | 7.91 | 36.24 | 34.99 | 21.17 | 78 | | Baichuan2 | 13B | 6.70 | 16.10 | 6.76 | 24.97 | 19.08 | 14.89 | 79 | | ToolLlama | 7B | 0.20 | 4.83 | 1.06 | 15.62 | 10.66 | 6.04 | 80 | | AgentLM | 13B | 0.17 | 0.15 | 0.05 | 16.30 | 15.22 | 4.88 | 81 | | Qwen-MAT | 7B | 31.64 | 43.30 | 33.34 | 44.85 | 44.78 | 39.85 | 82 | | Baichuan2-MAT | 13B | 37.27 | 52.97 | 37.00 | 48.01 | 41.83 | 45.34 | 83 | | Qwen-MAT | 14B | 43.17 | 63.78 | 32.14 | 45.47 | 45.22 | 49.94 | 84 | | Qwen1.5-MAT | 14B | 42.42 | 64.62 | 30.58 | 46.51 | 45.95 | 50.18 | 85 | 86 | 87 | 2. 
人間による評価。各結果セルには、合格率(%)と平均点(括弧内)を示す。 88 | 89 | | | Scale | NoAgent | ReACT | Auto-GPT | KAgentSys | 90 | |-----------------|---------|-----------------|----------------|-----------------|-----------------| 91 | | GPT-4 | - | 57.21% (3.42) | 68.66% (3.88) | 79.60% (4.27) | 83.58% (4.47) | 92 | | GPT-3.5-turbo | - | 47.26% (3.08) | 54.23% (3.33) | 61.74% (3.53) | 64.18% (3.69) | 93 | | Qwen | 7B | 52.74% (3.23) | 51.74% (3.20) | 50.25% (3.11) | 54.23% (3.27) | 94 | | Baichuan2 | 13B | 54.23% (3.31) | 55.72% (3.36) | 57.21% (3.37) | 58.71% (3.54) | 95 | | Qwen-MAT | 7B | - | 58.71% (3.53) | 65.67% (3.77) | 67.66% (3.87) | 96 | | Baichuan2-MAT | 13B | - | 61.19% (3.60) | 66.67% (3.86) | 74.13% (4.11) | 97 | 98 | 99 | ## ユーザーガイド 100 | 101 | ### プリビルド環境 102 | まずビルド環境として miniconda をインストールします。次にビルド環境を作成します: 103 | ```bash 104 | conda create -n kagent python=3.10 105 | conda activate kagent 106 | pip install -r requirements.txt 107 | ``` 108 | 109 | ### AgentLMs の使用 110 | #### [vLLM](https://github.com/vllm-project/vllm) によるサービング(GPU) 111 | モデル推論サービスの導入には [vLLM](https://github.com/vllm-project/vllm) と [FastChat](https://github.com/lm-sys/FastChat) の利用を推奨します。まず、対応するパッケージをインストールする必要があります(詳細な使用方法については、2つのプロジェクトのドキュメントを参照してください): 112 | 1. Qwen-7B-MAT の場合は、以下のコマンドで対応するパッケージをインストールしてください 113 | ```bash 114 | pip install vllm 115 | pip install "fschat[model_worker,webui]" 116 | ``` 117 | 2. 
Baichuan-13B-MAT については、以下のコマンドで対応するパッケージをインストールしてください 118 | ```bash 119 | pip install "fschat[model_worker,webui]" 120 | pip install vllm==0.2.0 121 | pip install transformers==4.33.2 122 | ``` 123 | 124 | KAgentLM をデプロイするには、まず1つのターミナルでコントローラを起動する必要があります。 125 | ```bash 126 | python -m fastchat.serve.controller 127 | ``` 128 | 次に、シングル GPU 推論サービスを展開するには、別の端末で次のコマンドを使用します: 129 | ```bash 130 | python -m fastchat.serve.vllm_worker --model-path $model_path --trust-remote-code 131 | ``` 132 | ここで `$model_path` はダウンロードしたモデルのローカルパスである。GPU が Bfloat16 をサポートしていない場合は、コマンドラインに`--dtype half` を追加することができます。 133 | 134 | 第3に、3番目の端末で REST API サーバーを起動する。 135 | ```bash 136 | python -m fastchat.serve.openai_api_server --host localhost --port 8888 137 | ``` 138 | 139 | 最後に、OpenAI の呼び出し形式と同じように、curl コマンドを使ってモデルを呼び出すことができます。以下に例を示します: 140 | ```bash 141 | curl http://localhost:8888/v1/chat/completions \ 142 | -H "Content-Type: application/json" \ 143 | -d '{"model": "kagentlms_qwen_7b_mat", "messages": [{"role": "user", "content": "Who is Andy Lau"}]}' 144 | ``` 145 | ここで、`kagentlms_qwen_7b_mat` をデプロイしたモデルに変更する。 146 | 147 | #### [Lamma.cpp](https://github.com/ggerganov/llama.cpp)によるサービング (CPU) 148 | llama-cpp-python は、OpenAI API のドロップイン置き換えとして機能することを目的としたウェブサーバーを提供します。これにより、llama.cpp 互換のモデルを OpenAI 互換のクライアント(言語ライブラリやサービスなど)で使うことができます。変換されたモデルは [kwaikeg/kagentlms_qwen_7b_mat_gguf](https://huggingface.co/kwaikeg/kagentlms_qwen_7b_mat_gguf) にあります。 149 | 150 | サーバーパッケージをインストールして開始するには: 151 | ```bash 152 | pip install "llama-cpp-python[server]" 153 | python3 -m llama_cpp.server --model kagentlms_qwen_7b_mat_gguf/ggml-model-q4_0.gguf --chat_format chatml --port 8888 154 | ``` 155 | 156 | 最後に、OpenAI の呼び出し形式と同じように、curl コマンドを使ってモデルを呼び出すことができます。以下に例を示します: 157 | ```bash 158 | curl http://localhost:8888/v1/chat/completions \ 159 | -H "Content-Type: application/json" \ 160 | -d '{"messages": [{"role": "user", "content": "Who is Andy Lau"}]}' 161 | ``` 162 | 163 | ### KAgentSys-Lite の使用 164 | KwaiAgents 
をダウンロードしてインストールします。Python 3.10 以上を推奨します。 165 | ```bash 166 | git clone git@github.com:KwaiKEG/KwaiAgents.git 167 | cd KwaiAgents 168 | python setup.py develop 169 | ``` 170 | 171 | 1. **ChatGPT の使用** 172 | 環境変数を宣言する 173 | ``` 174 | export OPENAI_API_KEY=sk-xxxxx 175 | export WEATHER_API_KEY=xxxxxx 176 | ``` 177 | 178 | WEATHER_API_KEY は必須ではないが、気象関連の質問をする際には設定する必要がある。API キーは[このサイト](https://www.weatherapi.com/)から取得できます(ローカルモデル利用時も同じ)。 179 | 180 | ```bash 181 | kagentsys --query="Who is Andy Lau's wife?" --llm_name="gpt-3.5-turbo" --lang="en" 182 | ``` 183 | 184 | 2. **ローカルモデルの使用** 185 | > ローカルモデルを使うためには、前の章で説明したように、対応するモデルサービスをデプロイする必要があります 186 | ```bash 187 | kagentsys --query="Who is Andy Lau's wife?" --llm_name="kagentlms_qwen_7b_mat" \ 188 | --use_local_llm --local_llm_host="localhost" --local_llm_port=8888 --lang="en" 189 | ``` 190 | 191 | 192 | 全コマンド引数: 193 | 194 | ``` 195 | options: 196 | -h, --help このヘルプメッセージを表示して終了する 197 | --id ID この会話の ID 198 | --query QUERY ユーザーのクエリ 199 | --history HISTORY 会話の履歴 200 | --llm_name LLM_NAME llm の名前 201 | --use_local_llm ローカル llm を使うかどうか 202 | --local_llm_host LOCAL_LLM_HOST 203 | ローカル llm サービスのホスト 204 | --local_llm_port LOCAL_LLM_PORT 205 | ローカル llm サービスのポート 206 | --tool_names TOOL_NAMES 207 | llm の名前 208 | --max_iter_num MAX_ITER_NUM 209 | エージェントの繰り返し数 210 | --agent_name AGENT_NAME 211 | エージェント名 212 | --agent_bio AGENT_BIO 213 | エージェントの経歴、簡単な説明 214 | --agent_instructions AGENT_INSTRUCTIONS 215 | エージェントの思考、行動、会話方法の指示 216 | --external_knowledge EXTERNAL_KNOWLEDGE 217 | 外部のナレッジのリンク 218 | --lang {en,zh} システム全体の言語 219 | --max_tokens_num モデル入力の最大長 220 | ``` 221 | 222 | **注**: 223 | 1. `browse_website` ツールを使用する必要がある場合は、サーバーで [chromedriver](https://chromedriver.chromium.org/getting-started) を設定する必要があります。 224 | 2. 
検索に何度も失敗する場合は、ネットワークが duckduckgo_search にアクセスできないためかもしれません。`http_proxy` を設定することで解決できます。 225 | 226 | #### カスタムツールの使用 227 | カスタムツールの使用方法はexamples/custom_tool_example.pyで見つけることができます" 228 | 229 | ### KAgentBench 評価の使用 230 | エージェントの能力を評価するために必要なのは、以下の2行だけです: 231 | ```bash 232 | cd benchmark 233 | python infer_qwen.py qwen_benchmark_res.jsonl 234 | python benchmark_eval.py ./benchmark_eval.jsonl ./qwen_benchmark_res.jsonl 235 | ``` 236 | 上記のコマンドを実行すると、次のような結果が得られます 237 | ``` 238 | plan : 31.64, tooluse : 43.30, reflextion : 33.34, conclusion : 44.85, profile : 44.78, overall : 39.85 239 | ``` 240 | 241 | 詳しくはベンチマークをご覧ください。 242 | 243 | ## 引用 244 | ``` 245 | @article{pan2023kwaiagents, 246 | author = {Haojie Pan and 247 | Zepeng Zhai and 248 | Hao Yuan and 249 | Yaojia Lv and 250 | Ruiji Fu and 251 | Ming Liu and 252 | Zhongyuan Wang and 253 | Bing Qin 254 | }, 255 | title = {KwaiAgents: Generalized Information-seeking Agent System with Large Language Models}, 256 | journal = {CoRR}, 257 | volume = {abs/2312.04889}, 258 | year = {2023} 259 | } 260 | ``` 261 | -------------------------------------------------------------------------------- /README_ZH.md: -------------------------------------------------------------------------------- 1 |
4 |
7 |
8 |
9 |
10 |
11 |
12 | 📚 Dataset | 📚 Benchmark | 🤗 Models | 📑 Paper
13 |
14 |
15 |
16 | KwaiAgents 是[快手快知团队](https://github.com/KwaiKEG)开源的一整套Agent系列工作。开源的内容包括:
17 | 1. **KAgentSys-Lite**:论文中KAgentSys的轻量版系统,其保留了部分原系统的功能。与功能齐全的系统相比,KAgentSys-Lite(1)缺少部分工具;(2)缺乏记忆机制;(3)性能稍有降低;(4)不同的代码库,Lite版本基于开源项目如BabyAGI和Auto-GPT。尽管有这些变更,KAgentSys-Lite在众多开源Agent系统中仍具有较好的性能。
18 | 2. **KAgentLMs**:经过论文中提出的Meta-agent tuning过后,具有Agents的规划、反思、工具使用等能力的系列大模型。
19 | 3. **KAgentInstruct**:超过20w(部分人工编辑)的Agent相关的指令微调数据。
20 | 4. **KAgentBench**:超过3k条经人工编辑的自动化评测Agent能力数据,能力评测维度包含规划、工具使用、反思、总结、人设指令等。
21 |
22 |
23 |
类别 | 26 |模型 | 27 |训练数据 | 28 |评测数据 | 29 |
Qwen | 32 |
33 | Qwen-7B-MAT 34 | Qwen-14B-MAT 35 | Qwen-7B-MAT-cpp 36 | Qwen1.5-14B-MAT 37 | |
38 | KAgentInstruct | 39 |KAgentBench | 40 |
Baichuan | 43 |Baichuan2-13B-MAT | 44 |
51 |
52 |
57 |
58 |
59 |
60 | ## 动态
61 | * 2024.4.19 - Qwen1.5-14B-MAT模型[[link]](https://huggingface.co/kwaikeg/kagentlms_qwen1.5_14b_mat) 公开.
62 | * 2024.4.9 - Benchmark结果更新.
63 | * 2024.1.29 - Qwen-14B-MAT模型 [[link]](https://huggingface.co/kwaikeg/kagentlms_qwen_14b_mat) 公开.
64 | * 2023.1.5 - 训练数据 [[link]](https://huggingface.co/datasets/kwaikeg/KAgentInstruct) 公开.
65 | * 2023.12.27 - 🔥🔥🔥 KwaiAgents 被国内外多个媒体报道[[机器之心]](https://mp.weixin.qq.com/s/QhZIFL1GHH90z98gnk194g) [[Medium]](https://medium.com/@myscarletpan/can-7b-models-now-master-ai-agents-a-look-at-kwais-recent-llm-open-source-release-8b9e84647412) [[InfoQ]](https://www.infoq.cn/article/xHGJwG3b8hXSdaP4m6r0)等.
66 | * 2023.12.13 - Benchmark和评测脚本 [[link]](https://huggingface.co/datasets/kwaikeg/KAgentBench) 公开.
67 | * 2023.12.08 - 技术报告 [[link]](https://arxiv.org/abs/2312.04889) 公开.
68 | * 2023.11.17 - 项目公开.
69 |
70 | ## 评测表现
71 | 1. KAgentLMs在Benchmark上的表现
72 |
73 | | | Scale | Planning | Tool-use | Reflection | Concluding | Profile | Overall Score |
74 | |----------------|-------|----------|----------|------------|------------|---------|---------------|
75 | | GPT-3.5-turbo | - | 18.55 | 26.26 | 8.06 | 37.26 | 35.42 | 25.63 |
76 | | Llama2 | 13B | 0.15 | 0.44 | 0.14 | 16.60 | 17.73 | 5.30 |
77 | | ChatGLM3 | 6B | 7.87 | 11.84 | 7.52 | 30.01 | 30.14 | 15.88 |
78 | | Qwen | 7B | 13.34 | 18.00 | 7.91 | 36.24 | 34.99 | 21.17 |
79 | | Baichuan2 | 13B | 6.70 | 16.10 | 6.76 | 24.97 | 19.08 | 14.89 |
80 | | ToolLlama | 7B | 0.20 | 4.83 | 1.06 | 15.62 | 10.66 | 6.04 |
81 | | AgentLM | 13B | 0.17 | 0.15 | 0.05 | 16.30 | 15.22 | 4.88 |
82 | | Qwen-MAT | 7B | 31.64 | 43.30 | 33.34 | 44.85 | 44.78 | 39.85 |
83 | | Baichuan2-MAT | 13B | 37.27 | 52.97 | 37.00 | 48.01 | 41.83 | 45.34 |
84 | | Qwen-MAT | 14B | 43.17 | 63.78 | 32.14 | 45.47 | 45.22 | 49.94 |
85 | | Qwen1.5-MAT | 14B | 42.42 | 64.62 | 30.58 | 46.51 | 45.95 | 50.18 |
86 |
87 |
88 | 2. KAgentSys在人工评测上的表现 (百分号前表示通过率,括号内表示平均分)
89 |
90 | | | Scale | NoAgent | ReACT | Auto-GPT | KAgentSys |
91 | |-----------------|---------|-----------------|----------------|-----------------|-----------------|
92 | | GPT-4 | - | 57.21% (3.42) | 68.66% (3.88) | 79.60% (4.27) | 83.58% (4.47) |
93 | | GPT-3.5-turbo | - | 47.26% (3.08) | 54.23% (3.33) | 61.74% (3.53) | 64.18% (3.69) |
94 | | Qwen | 7B | 52.74% (3.23) | 51.74% (3.20) | 50.25% (3.11) | 54.23% (3.27) |
95 | | Baichuan2 | 13B | 54.23% (3.31) | 55.72% (3.36) | 57.21% (3.37) | 58.71% (3.54) |
96 | | Qwen-MAT | 7B | - | 58.71% (3.53) | 65.67% (3.77) | 67.66% (3.87) |
97 | | Baichuan2-MAT | 13B | - | 61.19% (3.60) | 66.67% (3.86) | 74.13% (4.11) |
98 |
99 | ## 使用指南
100 |
101 | ### AgentLMs 系列模型使用
102 | #### 在GPU上用vLLM部署
103 | 我们建议用[vLLM](https://github.com/vllm-project/vllm)和[FastChat](https://github.com/lm-sys/FastChat)来部署模型推理服务,首先需要安装对应的包(详细使用请参考两个项目对应文档):
104 | 1. 对于 Qwen-7B-MAT,按如下方法安装
105 | ```bash
106 | pip install vllm
107 | pip install "fschat[model_worker,webui]"
108 | ```
109 | 2. 对于 Baichuan-13B-MAT,按如下方法安装
110 | ```bash
111 | pip install "fschat[model_worker,webui]"
112 | pip install vllm==0.2.0
113 | pip install transformers==4.33.2
114 | ```
115 |
116 | 为了能够部署KAgentLMs系列模型,首先需要在一个终端开启controler
117 | ```bash
118 | python -m fastchat.serve.controller
119 | ```
120 | 然后,再在另一个终端开启单卡模型推理服务部署
121 | ```bash
122 | python -m fastchat.serve.vllm_worker --model-path $model_path --trust-remote-code
123 | ```
124 | 其中`$model_path`为从huggingface中下载的模型本地路径,如果显示GPU不支持Bfloat16,可以再命令行后再加个`--dtype half`。
125 | 然后,在第三个终端上开启REST API服务器
126 | ```bash
127 | python -m fastchat.serve.openai_api_server --host localhost --port 8888
128 | ```
129 |
130 | 最后你就可以用curl命令对应OpenAI调用格式进行模型调用啦,参考示例:
131 | ```bash
132 | curl http://localhost:8888/v1/chat/completions \
133 | -H "Content-Type: application/json" \
134 | -d '{"model": "kagentlms_qwen_7b_mat", "messages": [{"role": "user", "content": "刘德华是谁"}]}'
135 | ```
136 | 这里 `kagentlms_qwen_7b_mat` 要改成你部署的模型。
137 |
138 | #### 在CPU上用[Llama.cpp](https://github.com/ggerganov/llama.cpp)部署
139 | llama-cpp-python 提供了类似OpenAI的API Web接口,我们可以按如下方法安装和部署。转换后的模型可以在[kwaikeg/kagentlms_qwen_7b_mat_gguf](https://huggingface.co/kwaikeg/kagentlms_qwen_7b_mat_gguf)上找到。
140 | ```bash
141 | pip install "llama-cpp-python[server]"
142 | python3 -m llama_cpp.server --model kagentlms_qwen_7b_mat_gguf/ggml-model-q4_0.gguf --chat_format chatml --port 8888
143 | ```
144 |
145 | 最后你就可以用curl命令对应OpenAI调用格式进行模型调用啦,参考示例:
146 | ```bash
147 | curl http://localhost:8888/v1/chat/completions \
148 | -H "Content-Type: application/json" \
149 | -d '{"messages": [{"role": "user", "content": "刘德华是谁"}]}'
150 | ```
151 |
152 | ### KAgentSys-Lite 快速使用
153 | 下载并安装环境包,建议Python>=3.10
154 | ```bash
155 | git clone git@github.com:KwaiKEG/KwaiAgents.git
156 | cd KwaiAgents
157 | python setup.py develop
158 | ```
159 |
160 | 1. **ChatGPT调用**
161 | 声明一些环境变量
162 | ```
163 | export OPENAI_API_KEY=sk-xxxxx
164 | export WEATHER_API_KEY=xxxxxx
165 | ```
166 |
167 | 其中WEATHER_API_KEY不是必须,但问到天气相关的问题时需要进行配置,APIKEY可以从[这个网站](https://www.weatherapi.com/)中获取(本地模型调用同)。
168 |
169 | ```bash
170 | kagentsys --query="刘德华老婆是谁?" --llm_name="gpt-3.5-turbo" --lang="zh"
171 | ```
172 |
173 | 2. **本地模型调用**
174 | > 调用本地模型需要参考上一章部署对应模型服务
175 | ```bash
176 | kagentsys --query="刘德华老婆是谁?" --llm_name="kagentlms_qwen_7b_mat" \
177 | --use_local_llm --local_llm_host="localhost" --local_llm_port=8888 --lang="zh"
178 | ```
179 |
180 | 下面是完整的命令行参数
181 |
182 | | 参数名 | 类型 | 默认值 | 描述 |
183 | | ----- | ---- | ------ | --- |
184 | | --id | str | test | 对话的ID |
185 | | --query | str | | 用户查询问题 |
186 | | --history | str | [] | 对话历史 |
187 | | --llm_name | str | gpt-3.5-turbo | LLM的名称 |
188 | | --use_local_llm | str | False | 是否使用本地LLM |
189 | | --local_llm_host | str | localhost | 本地LLM部署的IP |
190 | | --local_llm_port | int | 8888 | 本地LLM部署的端口 |
191 | | --tool_names | str | ["auto"] | 使用工具的列表,可选有 web_search,browse_website,get_weather_info,get_calendar_info,time_delta,get_solar_terms_info |
192 | | --max_iter_num | int | 1 | agent迭代次数 |
193 | | --agent_name | str | | agent名称 |
194 | | --agent_bio | str | | agent简介,简短的描述 |
195 | | --agent_instructions | str | | agent的指导原则,描述agent如何思考、行动、或交流 |
196 | | --external_knowledge | str | | 外部知识链接 |
197 | | --lang | str | en | 系统的语言,可选(英语/中文) |
198 | | --max_tokens_num | int | 4096 | Prompt截断最大长度 |
199 |
200 | **提示**:
201 | 1. 如果需要用到 browse_website 工具,需要在服务器上配置[chromedriver](https://chromedriver.chromium.org/getting-started)
202 | 2. 如果多次显示搜索失败,可能是网络无法访问duckduckgo_search,可以通过设置`http_proxy`解决
203 |
204 | #### 使用自定义工具
205 | 自定义工具使用可参考这个例子 examples/custom_tool_example.py
206 |
207 | ### KAgentBench效果评估
208 | 仅需两行代码就可以:
209 | ```bash
210 | cd benchmark
211 | python infer_qwen.py qwen_benchmark_res.jsonl
212 | python benchmark_eval.py ./benchmark_eval.jsonl ./qwen_benchmark_res.jsonl
213 | ```
214 | 上面的命令会输出以下结果
215 | ```
216 | plan : 31.64, tooluse : 43.30, reflextion : 33.34, conclusion : 44.85, profile : 44.78, overall : 39.85
217 | ```
218 | 更多细节请参考 benchmark/
219 |
220 |
221 | ## Citation
222 | ```
223 | @article{pan2023kwaiagents,
224 | author = {Haojie Pan and
225 | Zepeng Zhai and
226 | Hao Yuan and
227 | Yaojia Lv and
228 | Ruiji Fu and
229 | Ming Liu and
230 | Zhongyuan Wang and
231 | Bing Qin
232 | },
233 | title = {KwaiAgents: Generalized Information-seeking Agent System with Large Language Models},
234 | journal = {CoRR},
235 | volume = {abs/2312.04889},
236 | year = {2023}
237 | }
238 | ```
239 |
--------------------------------------------------------------------------------
/benchmark/README.md:
--------------------------------------------------------------------------------
1 |
2 | KAgentBench is the benchmark proposed in KwaiAgents ([Github](https://github.com/KwaiKEG/KwaiAgents)), which is a series of Agent-related works open-sourced by the [KwaiKEG](https://github.com/KwaiKEG) from [Kuaishou Technology](https://www.kuaishou.com/en). It contains over 3,000 human-edited, automated evaluation data for testing Agent capabilities, with evaluation dimensions including planning, tool-use, reflection, concluding, and profiling.
3 |
4 |
5 | ## Overall statistics of KAgentBench
6 | ---
7 |
8 | | type| #Queries | #Inst | Avg. #Ground | Avg. #Tools | Avg. #Turns | Avg. #Tasks | Avg. Len-Know | Metric |
9 | | :-------: | :-------:| :-------: | :-------: | :-------: | :-------: | :-------: | :-------: | :-------: |
10 | | Planning & Tool-use | 320 | 1,317 | 4.12 | 8.68 | 1.51 | 2.21 | 245.31 | ROUGE-L, EM |
11 | | Reflection | 68 | 272 | 4 | 12 | 1 | 3.97 | 1369.04 | ROUGE-L, EM |
12 | | Concluding | 245 | 1,225 | 5 | - | 1.52 | 2.14 | 923.96 | ROUGE-L |
13 | | Profile | 433 | 433 | 5 | - | 1.99 | - | - | ROUGE-L |
14 |
15 |
16 |
17 |
18 | ## Experimental results of different LLMs on KAgentBench
19 | ---
20 | The specific performance of different models on benchmarks can be seen in more detail in our [paper](https://arxiv.org/abs/2312.04889).
21 |
22 | | | Scale | Planning | Tool-use | Reflection | Concluding | Profile | Overall Score |
23 | |----------------|-------|----------|----------|------------|------------|---------|---------------|
24 | | GPT-3.5-turbo | - | 18.55 | 26.26 | 8.06 | 37.26 | 35.42 | 25.63 |
25 | | Llama2 | 13B | 0.15 | 0.44 | 0.14 | 16.60 | 17.73 | 5.30 |
26 | | ChatGLM3 | 6B | 7.87 | 11.84 | 7.52 | 30.01 | 30.14 | 15.88 |
27 | | Qwen | 7B | 13.34 | 18.00 | 7.91 | 36.24 | 34.99 | 21.17 |
28 | | Baichuan2 | 13B | 6.70 | 16.10 | 6.76 | 24.97 | 19.08 | 14.89 |
29 | | ToolLlama | 7B | 0.20 | 4.83 | 1.06 | 15.62 | 10.66 | 6.04 |
30 | | AgentLM | 13B | 0.17 | 0.15 | 0.05 | 16.30 | 15.22 | 4.88 |
31 | | Qwen-MAT | 7B | 31.64 | 43.30 | 33.34 | 44.85 | 44.78 | 39.85 |
32 | | Baichuan2-MAT | 13B | 37.27 | 52.97 | 37.00 | 48.01 | 41.83 | 45.34 |
33 |
34 |
35 |
36 | ## JSON Format
37 | ---
38 |
39 | Each data point is
40 | a dict with the following keys:
41 | - `id`: a unique id for this data point. This is useful for evaluation.
42 | - `query`: a string.
43 | - `type`: a string, the type of this data (plantooluse, reflextion, conclusion, profile).
44 | - `golden_result_list`: a list. The reference response.
45 | - `funcs`: a list of functions that may be used in the current query
46 | - `prompt_input`: a dict, input composed of different prompt templates
47 | - `memory`: a string
48 | - `memory_type`: a string, the type of memory: task, knowledge, or conversation
49 | - `memory_last_task`: a list, in the case where memory is task, the last task information in the previous round
50 |
51 | The overall data format is as follows
52 | ```json
53 | {
54 | "id": "",
55 | "query": "",
56 | "type": "",
57 | "golden_result_list": [],
58 | "funcs": [],
59 | "prompt_input": {},
60 | "memory": "",
61 | "memory_type": "",
62 | "memory_last_task": {}
63 | }
64 | ```
65 |
66 | ## How to download benchmark
67 | ---
68 |
69 | You can download the benchmark evaluation set through [kwaikeg/KAgentBench](https://huggingface.co/datasets/kwaikeg/KAgentBench/tree/main), or you can also download the benchmark evaluation set on [KwaiAgents](https://github.com/KwaiKEG/KwaiAgents).
70 | The filename of the evaluation set is 'benchmark_eval.jsonl'. Download the file to your local system.
71 |
72 | ## Environment Setup
73 | ---
74 |
75 | Please make sure you have setup the environment and installed the required packages. Make sure you meet the above requirements, and then install the dependent libraries.
76 | ```bash
77 | pip install -r requirements.txt
78 | ```
79 |
80 | ## Benchmark Inference
81 | To run benchmark evaluations using different models, it is necessary to appropriately load and predict according to the model in the inference script. Different models may have variations in their initialization and loading methods. We have provided inference scripts for both the Qwen and Baichuan models. Inference for other models can be adapted based on the scripts we have provided.
82 | Taking the provided open-source model kagentlms_qwen_7b_mat as an example.(The kagentlms_qwen_7b_mat model has been uploaded to [huggingface](https://huggingface.co/kwaikeg/kagentlms_qwen_7b_mat))
83 | Run the script to perform benchmark predictions. The parameter is the prediction results file.
84 | ```bash
85 | python infer_qwen.py qwen_benchmark_res.jsonl
86 | ```
87 | Similarly, to perform evaluations using the 'kagentlms_baichuan2_13b_mat' model, execute the following command.
88 | ```bash
89 | python infer_baichuan.py baichuan_benchmark_res.jsonl
90 | ```
91 | The prediction results will be stored in the 'model_predict' field, which is a dictionary (dict) structure. The key is the type of prompt, and the corresponding value is the output of the model. In the 'profile', as it contains only one prompt, 'model_predict' is a string, and the corresponding value is the model output.
92 |
93 | Below is an example display of a prediction result for 'conclusion' data.
94 | ```json
95 | {
96 | "query": "在过去的一年中,哪个月份的全球气温最高?",
97 | "id": "0ae75cf4-8897-5998-b74c-c7ae7202621c",
98 | "type": "conclusion",
99 | "memory_type": "task",
100 | "memory": "...",
101 | "funcs": [],
102 | "memory_last_task": {},
103 | "golden_result_list": [
104 | "2022年中,6月是全球最高气温。",
105 | "2022年中,全球最高气温是6月。",
106 | "2022年中,全球最高气温是6月。",
107 | "2022年中,6月是全球最高气温。",
108 | "2022年中,全球最高气温是6月。"
109 | ],
110 | "prompt_input": {...},
111 | "model_predict": {
112 | "ReACT": "2022年7月的全球气温最高,达到了17.23℃。",
113 | "AutoGPT": "在过去的一年中,全球气温最高的月份是2023年4月,全球表面平均气温达到了17.23°C,创下了历史新高。这一数据来自于美国国家海洋和大气管理局与美国缅因大学汇编的初步数据。",
114 | "ModelScope": "在过去一年中,全球气温最高的月份是2023年7月。根据美国国家航空航天局(NASA)和美国国家海洋和大气管理局(NOAA)的最新研究报告,2022年是史上排名第6的最热年份,尽管拉尼娜现象改变了天气模式,抑制了全球气温。然而,2023年7月的全球平均气温达到了17.23℃,超过了7月4日和5日创下的17.18℃的联合纪录,而后者之前曾打破了7月3日创下的17.01℃的纪录。",
115 | "ToolLlama": "Thought: I have found the information about the warmest month in 2022 in the memory. I will use this information to answer the question and call the Finish function to provide the final answer.\nAction: Finish\nAction Input: {\"return_type\": \"give_answer\", \"final_answer\": \"在2022年,全球最暖的月份是5月,比20世纪平均值高出1.39°F(0.77°C)。\"}",
116 | "Kuaiagent": "在过去的一年中,全球气温最高的月份是2023年7月。根据美国国家航空航天局(NASA)和美国国家海洋和大气管理局(NOAA)的最新研究报告,2023年7月的全球平均气温达到了17.23℃,超过了19世纪50年代有仪器记录以来的任何一个月。"
117 | }
118 | }
119 | ```
120 | '...' indicates that the content is too extensive. For the sake of convenient display format, the content has been abbreviated.
121 |
122 |
123 |
124 |
125 |
126 |
127 | ## Evaluation
128 | Taking the inference results of the 'kagentlms_qwen_7b_mat' model as an example, calculate the metrics based on the benchmark inference results obtained from the 'infer'. Execute the following command to get the overall score.
129 |
130 | The first parameter is the benchmark evaluation set, which contains reference responses manually annotated, and the second parameter is the prediction results of the model being evaluated.
131 | ```bash
132 | python benchmark_eval.py ./benchmark_eval.jsonl ./qwen_benchmark_res.jsonl
133 | ```
134 | The final model score is as follows:
135 | ```bash
136 | plan : 31.64, tooluse : 43.30, reflextion : 33.34, conclusion : 44.85, profile : 44.78, overall : 39.85
137 | ```
138 |
139 | ## Citation
140 | ```
141 | @article{pan2023kwaiagents,
142 | author = {Haojie Pan and
143 | Zepeng Zhai and
144 | Hao Yuan and
145 | Yaojia Lv and
146 | Ruiji Fu and
147 | Ming Liu and
148 | Zhongyuan Wang and
149 | Bing Qin
150 | },
151 | title = {KwaiAgents: Generalized Information-seeking Agent System with Large Language Models},
152 | journal = {CoRR},
153 | volume = {abs/2312.04889},
154 | year = {2023}
155 | }
156 | ```
--------------------------------------------------------------------------------
/benchmark/benchmark_eval.py:
--------------------------------------------------------------------------------
1 | """
2 | 进行benchmark的评估,包括:plan、tooluse、reflextion、conclusion、profile和最终score
3 | """
4 | import json, re, math, sys, logging, nltk, os, unicodedata, pandas as pd, time
5 | import contextlib
6 | import jsonlines
7 | from tqdm import tqdm
8 | from typing import Optional
9 | from rouge import Rouge
10 | from rouge_chinese import Rouge as RougeCh
11 | from nltk.translate.bleu_score import sentence_bleu
12 | from collections import defaultdict
# Log the interpreter's current recursion limit (debug aid).
print(sys.getrecursionlimit())

# Rouge's LCS computation is recursive; raise the recursion limit so that
# long inputs do not trigger RecursionError.
sys.setrecursionlimit(4096 * 4096)

# Fetch the NLTK 'punkt' tokenizer models required by nltk.word_tokenize below.
nltk.download('punkt')
19 |
def mixed_tokenize(sentence):
    """Tokenize *sentence* with NLTK, splitting CJK tokens into characters.

    Any token containing a character of Unicode category 'Lo' (the category
    of non-punctuation/symbol CJK characters) is exploded into individual
    characters; every other token is kept whole.
    """
    mixed = []
    for word in nltk.word_tokenize(sentence):
        contains_cjk = any(unicodedata.category(ch) == 'Lo' for ch in word)
        if contains_cjk:
            mixed.extend(word)
        else:
            mixed.append(word)
    return mixed
30 |
31 |
def rouge_score(label,predict):
    """Return the ROUGE-L F1 score between a reference and a prediction.

    Both inputs are coerced to str; an empty reference or prediction scores
    0. Texts are tokenized with mixed_tokenize so CJK text is compared
    character-by-character.
    """
    label, predict = str(label), str(predict)
    if not label or not predict:
        return 0
    tokenized_pred = " ".join(mixed_tokenize(predict))
    tokenized_ref = " ".join(mixed_tokenize(label))
    result = RougeCh().get_scores(tokenized_pred, tokenized_ref)
    return result[0]["rouge-l"]["f"]
44 |
45 |
def autogpt_response_process(gpt_out):
    """Extract the final response text from an AutoGPT-style output string.

    Outputs still containing a raw ``web_search(`` call are treated as having
    no answer. Otherwise the text after ``response="`` is returned with the
    closing ``")`` removed.
    """
    text = gpt_out
    if "web_search(" in text:
        text = ""
    marker = "response=\""
    if marker in text:
        text = text.split(marker)[1].replace("\")", "")
    return text
52 |
def toolllama_response_process(gpt_out):
    """Extract the final answer from a ToolLlama-style JSON output string.

    Returns the text following the '"final_answer": "' marker with all double
    quotes and closing braces stripped; a bare newline result is normalized
    to the empty string.
    """
    marker = "\"final_answer\": \""
    answer = gpt_out
    if marker in answer:
        answer = answer.split(marker)[1].replace("\"", "").replace("}", "")
    if answer == "\n":
        answer = ""
    return answer
59 |
def find_json_dict(input_str, cnt=0):
    """Best-effort extraction of a top-level JSON object from raw model output.

    While the string has more "{" than "}", append a closing brace and retry
    (bounded by cnt); then slice from the first "{" to the last '}\n}'
    sequence. Falls back to returning the input unchanged.
    """
    if input_str.count("{") > input_str.count("}"):
        # Unbalanced braces: close one and retry (recursion bounded by cnt).
        return find_json_dict(input_str.rstrip("\n") + "\n}", cnt + 1)
    if cnt >= 5:
        return input_str
    try:
        st = input_str.index("{")
        end_str = '}\n}'
        end = input_str.rindex(end_str)
        return input_str[st:end + len(end_str)].strip()
    except json.decoder.JSONDecodeError:
        # NOTE(review): index()/rindex() raise ValueError, not JSONDecodeError,
        # so this branch appears unreachable; failures fall through to the
        # bare except below and return the input unchanged.
        return find_json_dict(input_str.rstrip("\n") + "\n}", cnt + 1)
    except:
        return input_str
74 |
def add_quotes_to_property_names(json_string: str) -> str:
    """
    Add quotes to property names in a JSON string.

    Args:
        json_string (str): The JSON string.

    Returns:
        str: The JSON string with quotes added to property names.

    Raises:
        json.JSONDecodeError: If the corrected string is still not valid JSON.
    """

    def replace_func(match: re.Match) -> str:
        # Wrap the bare property name in double quotes.
        return f'"{match[1]}":'

    property_name_pattern = re.compile(r"(\w+):")
    corrected_json_string = property_name_pattern.sub(replace_func, json_string)

    # Validate the result; json.loads raises JSONDecodeError on failure, which
    # propagates to the caller (the previous try/except merely re-raised the
    # same exception and was redundant).
    json.loads(corrected_json_string)
    return corrected_json_string
97 |
98 |
def balance_braces(json_string: str) -> Optional[str]:
    """
    Balance the braces in a JSON string.

    Appends missing closing braces, or removes surplus *trailing* closing
    braces one at a time. (The previous implementation stripped ALL trailing
    braces with rstrip("}") while decrementing its counter by only one,
    which could remove too many braces and desynchronize the counts.)

    Args:
        json_string (str): The JSON string.

    Returns:
        str: The JSON string with braces balanced, or None if the balanced
        string still fails to parse.
    """

    open_braces_count = json_string.count("{")
    close_braces_count = json_string.count("}")

    while open_braces_count > close_braces_count:
        json_string += "}"
        close_braces_count += 1

    while close_braces_count > open_braces_count:
        if not json_string.endswith("}"):
            break  # surplus "}" is not trailing; nothing safe to strip
        json_string = json_string[:-1]
        close_braces_count -= 1

    with contextlib.suppress(json.JSONDecodeError):
        json.loads(json_string)
        return json_string
124 |
125 |
def correct_json(json_to_load: str) -> str:
    """
    Correct common JSON errors (invalid escape sequences, unquoted property
    names, unbalanced braces) in a best-effort, layered fashion.

    Args:
        json_to_load (str): The JSON string.
    """

    try:
        json.loads(json_to_load)
    except json.JSONDecodeError as first_err:
        message = str(first_err)
        if message.startswith("Invalid \\escape"):
            json_to_load = fix_invalid_escape(json_to_load, message)
        if message.startswith(
            "Expecting property name enclosed in double quotes"
        ):
            json_to_load = add_quotes_to_property_names(json_to_load)
            try:
                json.loads(json_to_load)
            except json.JSONDecodeError:
                pass
            else:
                return json_to_load
        # Last resort: brace balancing.
        balanced_str = balance_braces(json_to_load)
        if balanced_str:
            return balanced_str
        return json_to_load
    else:
        return json_to_load
153 |
def fix_invalid_escape(json_to_load: str, error_message: str) -> str:
    """Fix invalid escape sequences in JSON strings.

    Repeatedly deletes the offending backslash reported by the decoder until
    the string parses or the failure is no longer an escape error.

    Args:
        json_to_load (str): The JSON string.
        error_message (str): The error message from the JSONDecodeError
        exception.

    Returns:
        str: The JSON string with invalid escape sequences fixed.
    """
    while error_message.startswith("Invalid \\escape"):
        bad_pos = extract_char_position(error_message)
        # Drop the offending backslash and re-validate.
        json_to_load = json_to_load[:bad_pos] + json_to_load[bad_pos + 1:]
        try:
            json.loads(json_to_load)
        except json.JSONDecodeError as e:
            # print("json loads error - fix invalid escape", e)
            error_message = str(e)
        else:
            return json_to_load
    return json_to_load
177 |
def extract_char_position(error_message: str) -> int:
    """Extract the character position from the JSONDecodeError message.

    Args:
        error_message (str): The error message from the JSONDecodeError
        exception.

    Returns:
        int: The character position.

    Raises:
        ValueError: If no "(char N)" marker is present in the message.
    """
    found = re.search(r"\(char (\d+)\)", error_message)
    if found is None:
        raise ValueError("Character position not found in the error message.")
    return int(found.group(1))
195 |
196 |
def get_ReACT_plan_and_tool(response, funcs):
    """Parse a ReACT-format model response into (thought, tool_name, tool_args).

    Args:
        response (str): Raw model output in ReACT format
            ("...Action: <tool>Action Input: <args>...").
        funcs (list[dict]): Tool schemas; the first property name of the
            matched tool is used as the single argument key.

    Returns:
        tuple[str, str, dict]: thought, tool name and argument mapping;
        missing pieces default to ('None', 'None', {}).
    """
    thought, tool_name, tool_args_kv = 'None', 'None', {}

    thought_match = re.findall(r"(.+?)(?=(Final Answer|\Z|Action))", response, re.DOTALL)
    # Guard: an empty response previously raised IndexError on [0][0].
    if thought_match:
        thought = thought_match[0][0].strip()

    def get_react_func_key(func_name, funcs):
        # First declared property name of the named tool, or 'None'.
        key = 'None'
        for func in funcs:
            if func['name'] == func_name:
                try:
                    key = list(func['parameters']['properties'].keys())[0]
                except:
                    key = 'None'
        return key

    tool_name_re = re.findall(r"Action:(.+?)Action Input:", response, re.DOTALL)
    if len(tool_name_re) > 0:
        tool_name = tool_name_re[0].strip()
        key = get_react_func_key(tool_name, funcs)
        if key != 'None':
            value = re.findall(r"Action Input:(.+?)(?=(Observation|\Z))", response, re.DOTALL)
            if len(value) > 0:
                tool_args_kv = {
                    key: value[0][0].strip()
                }

    # Normalize empty results. (The original used `thought == 'None'`, a
    # no-op comparison, and compared the dict tool_args_kv with ''.)
    if thought == '':
        thought = 'None'
    if tool_name == '':
        tool_name = 'None'
    if not tool_args_kv:
        tool_args_kv = {}

    return thought, tool_name, tool_args_kv
232 |
233 |
def get_AutoGPT_plan_and_tool(response):
    """Parse an AutoGPT-style JSON response into (thought, tool_name, tool_args).

    The thought is taken from "thoughts" -> "text" and the tool call from
    "command" -> {"name", "args"}.

    Returns:
        tuple[str, str, dict]: defaults to ('None', 'None', {}) when the
        response is not a parseable JSON object.
    """
    thought, tool_name, tool_args_kv = 'None', 'None', {}
    try:
        response = correct_json(find_json_dict(response))
        res_json = json.loads(response)
        assert isinstance(res_json, dict)
    except:
        # Not a parseable JSON object at all.
        return thought, tool_name, tool_args_kv

    if 'thoughts' in res_json:
        if res_json['thoughts'] and 'text' in res_json['thoughts']:
            thought = res_json['thoughts']['text']

    if 'command' in res_json:
        if res_json['command'] and 'name' in res_json['command']:
            tool_name = res_json['command']['name']
        if res_json['command'] and 'args' in res_json['command']:
            # Non-dict args are ignored.
            if isinstance(res_json['command']['args'], dict):
                tool_args_kv = res_json['command']['args']

    # Normalize empty results. (The original used `thought == 'None'`, a
    # no-op comparison, and compared the dict tool_args_kv with ''.)
    if thought == '':
        thought = 'None'
    if tool_name == '':
        tool_name = 'None'
    if not tool_args_kv:
        tool_args_kv = {}

    return thought, tool_name, tool_args_kv
265 |
266 |
def get_ToolLlama_plan_and_tool(response):
    """Parse a ToolLlama-style response into (thought, tool_name, tool_args).

    Expected layout: "Thought: ... Action: ... Action Input: {json}".

    Returns:
        tuple[str, str, dict]: defaults to ('None', 'None', {}) for any piece
        that cannot be parsed.
    """
    thought, tool_name, tool_args_kv = 'None', 'None', {}

    try:
        thought_re = re.findall(r"Thought:(.+?)(?=(\Z|Action))", response, re.DOTALL)
        # The original assigned the findall LIST to `thought`, so a missing
        # "Thought:" section leaked an empty list instead of 'None'.
        if len(thought_re) > 0:
            thought = thought_re[0][0].strip()
        tool_name_re = re.findall(r"Action:(.+?)(?=(Action Input:|\Z))", response, re.DOTALL)
        if len(tool_name_re) > 0:
            tool_name = tool_name_re[0][0].strip()
        tool_re = re.findall(r"Action Input:(.+?)(?=(Thought|\Z))", response, re.DOTALL)
        if len(tool_re) > 0:
            candidate = tool_re[0][0].strip()
            try:
                candidate = correct_json(find_json_dict(candidate))
                tool_json = json.loads(candidate)
                assert isinstance(tool_json, dict)
                tool_args_kv = tool_json
            except:
                # Arguments that are not a JSON dict are ignored.
                pass
    except:
        pass

    # Normalize empty results. (The original used `thought == 'None'`, a
    # no-op comparison, and compared the dict tool_args_kv with ''.)
    if thought == '':
        thought = 'None'
    if tool_name == '':
        tool_name = 'None'
    if not tool_args_kv:
        tool_args_kv = {}

    return thought, tool_name, tool_args_kv
299 |
def get_KuaiAgent_plan_and_tool(response):
    """Parse a KwaiAgents-style JSON response into (thought, tool_name, tool_args).

    The thought is taken from "task_name" and the tool call from
    "command" -> {"name", "args"}.

    Returns:
        tuple[str, str, dict]: defaults to ('None', 'None', {}) when the
        response is not a parseable JSON object.
    """
    thought, tool_name, tool_args_kv = 'None', 'None', {}

    try:
        response = correct_json(find_json_dict(response))
        res_json = json.loads(response)
        assert isinstance(res_json, dict)
    except:
        # Not a parseable JSON object at all.
        return thought, tool_name, tool_args_kv

    if 'task_name' in res_json:
        thought = res_json['task_name']

    if res_json and 'command' in res_json:
        if 'name' in res_json['command']:
            tool_name = res_json['command']['name']
        if 'args' in res_json['command']:
            # Non-dict args are ignored.
            if isinstance(res_json['command']['args'], dict):
                tool_args_kv = res_json['command']['args']

    # Normalize empty results. (The original used `thought == 'None'`, a
    # no-op comparison, and compared the dict tool_args_kv with ''.)
    if thought == '':
        thought = 'None'
    if tool_name == '':
        tool_name = 'None'
    if not tool_args_kv:
        tool_args_kv = {}

    return thought, tool_name, tool_args_kv
333 |
def get_ModelScope_plan_and_tool(response):
    """Parse a ModelScope-style response into (thought, tool_name, tool_args).

    The tool call is the JSON object wrapped in <|startofthink|> ...
    <|endofthink|> markers; this format carries no separate thought, so the
    thought stays 'None'.

    Returns:
        tuple[str, str, dict]: defaults to ('None', 'None', {}).
    """
    thought, tool_name, tool_args_kv = 'None', 'None', {}

    task = re.findall(r"\<\|startofthink\|\>(.+?)\<\|endofthink\|\>", response, re.DOTALL)
    if len(task) > 0:
        task = task[0].strip()
        try:
            task = correct_json(find_json_dict(task))
            task = json.loads(task)
            assert isinstance(task, dict)
        except:
            # Not a parseable JSON object between the markers.
            return thought, tool_name, tool_args_kv

    # When no markers matched, `task` is still the empty findall list and
    # both checks below are skipped.
    if task and 'api_name' in task:
        tool_name = task['api_name']
    if task and 'parameters' in task:
        # Non-dict parameters are ignored.
        if isinstance(task['parameters'], dict):
            tool_args_kv = task['parameters']

    # Normalize empty results. (The original used `thought == 'None'`, a
    # no-op comparison, and compared the dict tool_args_kv with ''.)
    if thought == '':
        thought = 'None'
    if tool_name == '':
        tool_name = 'None'
    if not tool_args_kv:
        tool_args_kv = {}

    return thought, tool_name, tool_args_kv
366 |
367 |
368 |
def get_plan_metric(golden_thoughts, golden_toolnames, thought, tool_name):
    """Score a predicted plan against every golden reference; keep the best.

    A reference contributes ROUGE-L(thought) when the tool name matches
    exactly, otherwise 0; references with a 'None' thought or tool are
    skipped. Returns 0. when no usable reference exists.
    """
    scores = [
        rouge_score(gold_thought, thought) * (1 if tool_name == gold_tool else 0)
        for gold_thought, gold_tool in zip(golden_thoughts, golden_toolnames)
        if gold_thought != 'None' and gold_tool != 'None'
    ]
    return max(scores) if scores else 0.
380 |
381 |
382 |
383 |
def get_tool_metric(golden_toolnames, golden_tool_args, tool_name, tool_args):
    """Score a predicted tool call against every golden reference; keep the best.

    Per reference: an exact match on the tool name gates the score; argument
    quality is the mean ROUGE-L over the golden argument keys (keys missing
    from the prediction score 0). Two empty argument dicts count as a
    perfect argument match. 'None' references are skipped.
    """
    tool_metrics = []
    for gold_name, gold_args in zip(golden_toolnames, golden_tool_args):
        if gold_name == 'None':
            continue
        name_match = 1 if tool_name == gold_name else 0
        if gold_args == {} and tool_args == {}:
            per_key = [1.]
        elif tool_args != {}:
            per_key = [
                rouge_score(v, tool_args[k]) if k in tool_args else 0.
                for k, v in gold_args.items()
            ]
        else:
            per_key = [0.]
        mean_arg = sum(per_key) / len(per_key) if per_key else 0
        tool_metrics.append(mean_arg * name_match)

    return max(tool_metrics) if tool_metrics else 0.
411 |
412 |
def get_reflextion_metric(golden_thoughts, golden_toolnames, golden_tool_args, last_task_info, thought, tool_name, tool_args):
    """Score a reflection-step prediction against golden references; keep the best.

    Per reference: 0.3 * thought ROUGE-L + 0.7 * mean argument ROUGE-L, both
    gated by an exact tool-name match, and zeroed entirely when the golden
    call merely repeats the previous task (no real reflection happened).

    Args:
        last_task_info (dict): {"tool_name", "tool_args"} of the previous turn.

    Returns:
        float: best score over references; 0. when no usable reference
        exists. (The original called max() on an empty list here and raised
        ValueError, unlike get_plan_metric/get_tool_metric which guard it.)
    """
    reflextion_metrics = []
    for golden_thought, golden_toolname, golden_tool_arg in zip(golden_thoughts, golden_toolnames, golden_tool_args):
        if golden_thought == 'None' or golden_toolname == 'None':
            continue
        thought_rouge = rouge_score(golden_thought, thought)
        tool_em = 1 if tool_name == golden_toolname else 0
        avg_arg_rouges = []
        if golden_tool_arg == {} and tool_args == {}:
            avg_arg_rouges = [1.]
        elif tool_args != {}:
            for k, v in golden_tool_arg.items():
                if k in tool_args:
                    avg_arg_rouges.append(rouge_score(v, tool_args[k]))
                else:
                    avg_arg_rouges.append(0.)
        else:
            avg_arg_rouges = [0.]
        arg_rouge = sum(avg_arg_rouges) / len(avg_arg_rouges) if len(avg_arg_rouges) > 0 else 0
        # Penalty factor: 1 when the golden call repeats the previous task.
        if last_task_info["tool_name"] == golden_toolname and last_task_info["tool_args"] == golden_tool_arg:
            penalty_weight = 1
        else:
            penalty_weight = 0
        reflextion_score = (1 - penalty_weight) * (0.3 * tool_em * thought_rouge + 0.7 * tool_em * arg_rouge)
        reflextion_metrics.append(reflextion_score)

    # Guard against no usable references (consistent with the other metrics).
    if len(reflextion_metrics) == 0:
        reflextion_metrics = [0.]
    return max(reflextion_metrics)
445 |
def plan_tooluse_reflextion_predict(model_predict, funcs):
    """Parse each prompt template's raw prediction into a structured dict.

    Args:
        model_predict (dict): prompt template name -> raw model output string.
        funcs (list[dict]): tool schemas (used by the ReACT parser).

    Returns:
        list[dict]: one {"thought", "tool_name", "tool_args"} per template.
    """
    predict_parsed_list = []
    for prompt, predict in model_predict.items():
        # Reset per template: the original left these names unbound for an
        # unknown template (or an empty ReACT prediction), raising
        # UnboundLocalError on the first iteration or silently reusing the
        # previous template's values afterwards.
        thought, tool_name, tool_args_kv = 'None', 'None', {}
        if prompt == 'ReACT' and predict != "":
            thought, tool_name, tool_args_kv = get_ReACT_plan_and_tool(predict, funcs)
        elif prompt == 'AutoGPT':
            thought, tool_name, tool_args_kv = get_AutoGPT_plan_and_tool(predict)
        elif prompt == 'ToolLlama':
            thought, tool_name, tool_args_kv = get_ToolLlama_plan_and_tool(predict)
        elif prompt == 'ModelScope':
            thought, tool_name, tool_args_kv = get_ModelScope_plan_and_tool(predict)
        elif prompt == 'KuaiAgent':
            thought, tool_name, tool_args_kv = get_KuaiAgent_plan_and_tool(predict)
        predict_parsed_list.append({
            'thought': thought,
            'tool_name': tool_name,
            'tool_args': tool_args_kv,
        })

    return predict_parsed_list
468 |
def conclusion_metrics(label_dict, predict_dict):
    """Compute the conclusion score.

    For every sample, each prompt template's prediction is scored by its
    best ROUGE-L against the golden results; template scores are averaged
    per sample and the final score is the mean over samples.

    Args:
        label_dict (dict): id -> annotation with "golden_result_list".
        predict_dict (dict): id -> {"model_predict": {template: output}}.

    Returns:
        float: mean conclusion ROUGE-L over all samples.
    """
    all_rouge = []
    for id, obj in tqdm(predict_dict.items()):
        label_response_dict_list = label_dict[id]["golden_result_list"]
        label_response_list = []
        for i in label_response_dict_list:
            label_response_list.append(i["golden_result"])
        predict_parsed_list = obj["model_predict"]

        predict_pre_template_score = []

        for key, predict in predict_parsed_list.items():
            # Template-specific extraction of the final answer text.
            if key == "AutoGPT":
                predict = autogpt_response_process(predict)
            if key == "ToolLlama":
                predict = toolllama_response_process(predict)

            predict_pre_label_score = []
            if predict == "":
                predict_pre_label_score.append(0)
            else:
                if type(predict) == dict:
                    predict = json.dumps(predict, ensure_ascii=False)
                for label in label_response_list:
                    rouge_res = rouge_score(label, predict)
                    predict_pre_label_score.append(rouge_res)
            predict_pre_template_score.append(max(predict_pre_label_score))

        all_rouge.append(sum(predict_pre_template_score) / len(predict_pre_template_score))

    # (Removed the unused local `rouge_list` from the original.)
    conclusion_avg_rouge = sum(all_rouge) / len(all_rouge)

    return conclusion_avg_rouge
507 |
def profile_metrics(label_dict, predict_dict):
    """Compute the profile score.

    Per sample: the best ROUGE-L between the prediction and any golden
    result (0 for an empty prediction), averaged over all samples.

    Args:
        label_dict (dict): id -> annotation with "golden_result_list".
        predict_dict (dict): id -> {"model_predict": output string}.

    Returns:
        float: mean best ROUGE-L over all samples.
    """
    per_sample_best = []
    for sample_id, obj in tqdm(predict_dict.items()):
        golden = [item["golden_result"] for item in label_dict[sample_id]["golden_result_list"]]
        prediction = obj["model_predict"]

        if prediction == "":
            per_sample_best.append(0)
        else:
            per_sample_best.append(max(rouge_score(ref, prediction) for ref in golden))
    return sum(per_sample_best) / len(per_sample_best)
530 |
531 |
532 |
def plantooluse_metrics(label_dict, predict_dict):
    """Compute the plan and tool-use scores.

    For every sample, each template's parsed prediction is scored against
    the golden references (best-of inside the metric, mean over templates),
    then averaged over samples.

    Args:
        label_dict (dict): id -> annotation with "golden_result_list" and "funcs".
        predict_dict (dict): id -> {"model_predict": {template: output}}.

    Returns:
        tuple[float, float]: (plan score, tool-use score).
    """
    all_plan_rouge = []
    all_tooluse_rouge = []
    for id, obj in tqdm(predict_dict.items()):
        label_response_list = list(label_dict[id]["golden_result_list"])
        funcs = label_dict[id]["funcs"]
        predict_parsed_list = plan_tooluse_reflextion_predict(obj["model_predict"], funcs)
        plan_rouge_list = []
        tooluse_rouge_list = []
        label_thoughts = [label["thought"] for label in label_response_list]
        label_tool_names = [label["tool_name"] for label in label_response_list]
        label_tool_args = [label['tool_args'] for label in label_response_list]
        # (Removed the unused local `query` from the original.)
        for predict in predict_parsed_list:
            plan_metric = get_plan_metric(label_thoughts, label_tool_names, predict['thought'], predict['tool_name'])
            tool_metric = get_tool_metric(label_tool_names, label_tool_args, predict['tool_name'], predict['tool_args'])
            plan_rouge_list.append(plan_metric)
            tooluse_rouge_list.append(tool_metric)

        # The per-reference max happens inside the metric; average over templates here.
        all_plan_rouge.append(sum(plan_rouge_list) / len(plan_rouge_list))
        all_tooluse_rouge.append(sum(tooluse_rouge_list) / len(tooluse_rouge_list))

    plan_avg_score = sum(all_plan_rouge) / len(all_plan_rouge)
    tooluse_avg_score = sum(all_tooluse_rouge) / len(all_tooluse_rouge)
    return plan_avg_score, tooluse_avg_score
563 |
564 |
565 |
566 |
def reflextion_metrics(label_dict, predict_dict):
    """Compute the reflection score.

    Each template's parsed prediction is scored against the golden
    references (with a penalty for repeating the previous task), averaged
    over templates per sample and then over samples.

    Args:
        label_dict (dict): id -> annotation with "golden_result_list",
            "funcs" and "memory_last_task".
        predict_dict (dict): id -> {"model_predict": {template: output}}.

    Returns:
        float: mean reflection score over all samples.
    """
    all_reflextion_score = []
    for id, obj in predict_dict.items():
        label_response_list = list(label_dict[id]["golden_result_list"])
        funcs = label_dict[id]["funcs"]
        predict_parsed_list = plan_tooluse_reflextion_predict(obj["model_predict"], funcs)
        last_task_info = label_dict[id]["memory_last_task"]
        reflextion_score_list = []
        label_thoughts = [label["thought"] for label in label_response_list]
        label_tool_names = [label["tool_name"] for label in label_response_list]
        label_tool_args = [label['tool_args'] for label in label_response_list]
        # (Removed the unused locals `query_score`/`query` and the redundant
        # pre-initialization of predict_parsed_list from the original.)

        for predict in predict_parsed_list:
            reflextion_metric = get_reflextion_metric(label_thoughts, label_tool_names, label_tool_args, last_task_info, predict['thought'], predict['tool_name'], predict['tool_args'])
            reflextion_score_list.append(reflextion_metric)
        all_reflextion_score.append(sum(reflextion_score_list) / len(reflextion_score_list))

    reflextion_avg_score = sum(all_reflextion_score) / len(all_reflextion_score)
    return reflextion_avg_score
594 |
595 |
596 |
597 |
def _load_by_type(path):
    """Load a jsonl file and bucket its records by their "type" field.

    Returns:
        dict: type -> {id: record} for the four known benchmark task types.
    """
    buckets = {"plantooluse": {}, "reflextion": {}, "conclusion": {}, "profile": {}}
    with jsonlines.open(path, "r") as reader:
        for record in reader:
            # Avoid shadowing the builtins `type` and `id` as the original did.
            record_type = record["type"]
            if record_type in buckets:
                buckets[record_type][record["id"]] = record
    return buckets


def eval(eval_file, predict_file):
    """
    Run the full benchmark evaluation and print the per-task scores.

    Args:
        eval_file (str): jsonl file with the annotated golden references.
        predict_file (str): jsonl file with the model predictions.
    """
    print(f"load eval file from {eval_file}")
    print(f"load predict file from {predict_file}")

    # The original duplicated this loading logic for both files.
    labels = _load_by_type(eval_file)
    predicts = _load_by_type(predict_file)

    # Every annotated sample must have a matching prediction.
    for task in ("plantooluse", "reflextion", "conclusion", "profile"):
        assert len(labels[task]) == len(predicts[task])

    plan_score, tooluse_score = plantooluse_metrics(labels["plantooluse"], predicts["plantooluse"])
    reflextion_score = reflextion_metrics(labels["reflextion"], predicts["reflextion"])
    conclusion_score = conclusion_metrics(labels["conclusion"], predicts["conclusion"])
    profile_score = profile_metrics(labels["profile"], predicts["profile"])
    overall_score = (
        0.25 * plan_score +       # Weight for 'plantooluse' score
        0.35 * tooluse_score +    # Weight for 'tooluse' score
        0.1 * reflextion_score +  # Weight for 'reflection' score
        0.2 * conclusion_score +  # Weight for 'conclusion' score
        0.1 * profile_score       # Weight for 'profile' score
    )
    print(f"plan : {plan_score*100:.2f}, tooluse : {tooluse_score*100:.2f}, reflextion : {reflextion_score*100:.2f}, conclusion : {conclusion_score*100:.2f}, profile : {profile_score*100:.2f}, overall : {overall_score*100:.2f}")
659 |
660 |
661 |
662 |
663 |
664 |
if __name__ == "__main__":
    # Usage: python benchmark_eval.py <golden_eval.jsonl> <model_predictions.jsonl>
    eval(sys.argv[1], sys.argv[2])
667 |
668 |
669 |
670 |
671 |
672 |
673 |
--------------------------------------------------------------------------------
/benchmark/infer_baichuan.py:
--------------------------------------------------------------------------------
1 | """
2 | benchmark形式评估集推理
3 | """
4 | import os
5 | os.environ["CUDA_VISIBLE_DEVICES"] = "7"
6 | import sys
7 | import time
8 | import copy
9 | import jsonlines
10 | from tqdm import tqdm
11 | from vllm import LLM, SamplingParams
12 | from transformers import AutoModelForCausalLM, AutoTokenizer
13 | import transformers, datetime, json
14 |
15 | class ChatBaichuan:
    def __init__(self,
        model_name_or_path: str = "kwaikeg/kagentlms_baichuan2_13b_mat",
        template: str = 'baichuan2',
        input_max_length = 4096,
        ) -> None:
        """Load the Baichuan tokenizer and a vLLM engine for batched inference.

        Args:
            model_name_or_path: HuggingFace model id or local checkpoint path.
            template: prompt template family; must be 'baichuan' or 'baichuan2'.
            input_max_length: maximum number of batched tokens for the vLLM
                engine (passed as max_num_batched_tokens).
        """
        assert template in ['baichuan', 'baichuan2']
        self.template = template

        print('loading tokenizer')
        # use_fast=False / trust_remote_code=True: presumably required by the
        # custom Baichuan tokenizer implementation — TODO confirm.
        self.tokenizer = AutoTokenizer.from_pretrained(
            model_name_or_path,
            use_fast=False,
            padding_side='right',
            trust_remote_code=True
        )

        print('loading model')
        self.model = LLM(
            model = model_name_or_path,
            trust_remote_code=True,
            max_num_batched_tokens=input_max_length
        )
        print('loaded')
40 |
41 |
42 |
43 |
44 | def encode(self, tokenizer, query, history, system=''):
45 | prompt_ids = []
46 | history = history + [(query, None)]
47 | kwargs = dict(add_special_tokens=False)
48 | for turn_idx, (q, r) in enumerate(history):
49 | prefix_ids = tokenizer.encode(system, **kwargs) if turn_idx == 0 else []
50 | if self.template == 'baichuan':
51 | prompt = [' {data["description"].strip()} {data['fullname']} ({data["stars"]} stars, {data["forks"]} forks)
31 | "):
13 | header = [th.text.strip() for th in table.find_all('th')]
14 |
15 | # Extract rows
16 | rows = []
17 | for row in table.find_all('tr'):
18 | cells = row.find_all(['td', 'th'])
19 | rows.append([cell.text.strip() for cell in cells])
20 |
21 | if header:
22 | content_rows = rows
23 | else:
24 | header = rows[0]
25 | content_rows = rows[1:]
26 | return [header] + content_rows
27 |
28 |
def convert_bs_html_table_to_markdown(table):
    """Render a BeautifulSoup <table> element as a GitHub-style markdown table."""
    rows = convert_bs_html_table_to_list(table)
    header, body = rows[0], rows[1:]

    def render_row(cells):
        return '| ' + ' | '.join(cells) + ' |\n'

    lines = [render_row(header), render_row(['---'] * len(header))]
    lines.extend(render_row(row) for row in body)
    return ''.join(lines)
40 |
41 |
def convert_html_table_to_markdown(table_html):
    """Parse an HTML snippet and render its first <table> as markdown."""
    parsed = BeautifulSoup(table_html, 'html.parser')
    first_table = parsed.find('table')
    return convert_bs_html_table_to_markdown(first_table)
47 |
48 |
49 |
50 |
def extract_hyperlinks(soup: BeautifulSoup, base_url: str) -> list[tuple[str, str]]:
    """Extract hyperlinks from a BeautifulSoup object

    Args:
        soup (BeautifulSoup): The BeautifulSoup object
        base_url (str): The base URL

    Returns:
        List[Tuple[str, str]]: The extracted hyperlinks
    """
    links = []
    for anchor in soup.find_all("a", href=True):
        # Resolve relative hrefs against the page's base URL.
        links.append((anchor.text, urljoin(base_url, anchor["href"])))
    return links
65 |
66 |
def format_hyperlinks(hyperlinks: list[tuple[str, str]]) -> list[str]:
    """Format hyperlinks to be displayed to the user

    Args:
        hyperlinks (List[Tuple[str, str]]): The hyperlinks to format

    Returns:
        List[str]: The formatted hyperlinks
    """
    formatted = []
    for link_text, link_url in hyperlinks:
        formatted.append(f"{link_text} ({link_url})")
    return formatted
77 |
--------------------------------------------------------------------------------
/kwaiagents/utils/json_fix_general.py:
--------------------------------------------------------------------------------
1 | """This module contains functions to fix JSON strings using general programmatic approaches, suitable for addressing
2 | common JSON formatting issues."""
3 | from __future__ import annotations
4 |
5 | import contextlib
6 | import json
7 | import re
8 | from typing import Optional
9 |
10 |
def find_json_list(input_str):
    """Return the substring spanning the outermost JSON list brackets.

    Falls back to returning the input unchanged when no '[' or ']' is
    present. (index/rindex signal a miss with ValueError; the original's
    bare except also masked unrelated errors.)
    """
    try:
        st = input_str.index("[")
        end = input_str.rindex("]")
    except ValueError:
        return input_str
    return input_str[st:end + 1]
18 |
19 |
def find_json_dict(input_str, cnt=0):
    """Best-effort extraction of a top-level JSON object from raw model output.

    While the string has more "{" than "}", append a closing brace and retry
    (bounded by cnt); then slice from the first "{" to the last '}\n}'
    sequence. Falls back to returning the input unchanged.
    """
    if input_str.count("{") > input_str.count("}"):
        # Unbalanced braces: close one and retry (recursion bounded by cnt).
        return find_json_dict(input_str.rstrip("\n") + "\n}", cnt + 1)
    if cnt >= 5:
        return input_str
    try:
        st = input_str.index("{")
        end_str = '}\n}'
        end = input_str.rindex(end_str)
        return input_str[st:end + len(end_str)].strip()
    except json.decoder.JSONDecodeError:
        # NOTE(review): index()/rindex() raise ValueError, not JSONDecodeError,
        # so this branch appears unreachable; failures fall through to the
        # bare except below and return the input unchanged.
        return find_json_dict(input_str.rstrip("\n") + "\n}", cnt + 1)
    except:
        return input_str
34 |
35 |
def extract_char_position(error_message: str) -> int:
    """Extract the character position from the JSONDecodeError message.

    Args:
        error_message (str): The error message from the JSONDecodeError
        exception.

    Returns:
        int: The character position.

    Raises:
        ValueError: If no "(char N)" marker is present in the message.
    """
    match = re.search(r"\(char (\d+)\)", error_message)
    if match is None:
        raise ValueError("Character position not found in the error message.")
    return int(match.group(1))
52 |
53 |
def fix_invalid_escape(json_to_load: str, error_message: str) -> str:
    """Fix invalid escape sequences in JSON strings.

    Repeatedly deletes the offending backslash reported by the decoder until
    the string parses or the failure is no longer an escape error.

    Args:
        json_to_load (str): The JSON string.
        error_message (str): The error message from the JSONDecodeError
        exception.

    Returns:
        str: The JSON string with invalid escape sequences fixed.
    """
    while error_message.startswith("Invalid \\escape"):
        bad_pos = extract_char_position(error_message)
        # Drop the offending backslash and re-validate.
        json_to_load = json_to_load[:bad_pos] + json_to_load[bad_pos + 1:]
        try:
            json.loads(json_to_load)
        except json.JSONDecodeError as e:
            print("json loads error - fix invalid escape", e)
            error_message = str(e)
        else:
            return json_to_load
    return json_to_load
77 |
78 |
def balance_braces(json_string: str) -> Optional[str]:
    """
    Balance the braces in a JSON string.

    Appends missing closing braces, or removes surplus *trailing* closing
    braces one at a time. (The previous implementation stripped ALL trailing
    braces with rstrip("}") while decrementing its counter by only one,
    which could remove too many braces and desynchronize the counts.)

    Args:
        json_string (str): The JSON string.

    Returns:
        str: The JSON string with braces balanced, or None if the balanced
        string still fails to parse.
    """

    open_braces_count = json_string.count("{")
    close_braces_count = json_string.count("}")

    while open_braces_count > close_braces_count:
        json_string += "}"
        close_braces_count += 1

    while close_braces_count > open_braces_count:
        if not json_string.endswith("}"):
            break  # surplus "}" is not trailing; nothing safe to strip
        json_string = json_string[:-1]
        close_braces_count -= 1

    with contextlib.suppress(json.JSONDecodeError):
        json.loads(json_string)
        return json_string
104 |
105 |
def add_quotes_to_property_names(json_string: str) -> str:
    """
    Add quotes to property names in a JSON string.

    Args:
        json_string (str): The JSON string.

    Returns:
        str: The JSON string with quotes added to property names.

    Raises:
        json.JSONDecodeError: If the corrected string is still not valid JSON.
    """

    def replace_func(match: re.Match) -> str:
        # Wrap the bare property name in double quotes.
        return f'"{match[1]}":'

    property_name_pattern = re.compile(r"(\w+):")
    corrected_json_string = property_name_pattern.sub(replace_func, json_string)

    # Validate the result; json.loads raises JSONDecodeError on failure, which
    # propagates to the caller (the previous try/except merely re-raised the
    # same exception and was redundant).
    json.loads(corrected_json_string)
    return corrected_json_string
128 |
129 |
def correct_json(json_to_load: str) -> str:
    """
    Correct common JSON errors.
    Args:
        json_to_load (str): The JSON string.
    """

    try:
        json.loads(json_to_load)
    except json.JSONDecodeError as e:
        print("json loads error", e)
        error_message = str(e)
        if error_message.startswith("Invalid \\escape"):
            json_to_load = fix_invalid_escape(json_to_load, error_message)
        if error_message.startswith(
            "Expecting property name enclosed in double quotes"
        ):
            json_to_load = add_quotes_to_property_names(json_to_load)
            try:
                json.loads(json_to_load)
            except json.JSONDecodeError as e:
                print("json loads error - add quotes", e)
                error_message = str(e)
            else:
                return json_to_load
        # Last resort: brace balancing.
        balanced_str = balance_braces(json_to_load)
        if balanced_str:
            return balanced_str
        return json_to_load
    else:
        return json_to_load
--------------------------------------------------------------------------------
/kwaiagents/utils/nlp_utils.py:
--------------------------------------------------------------------------------
1 | import json
2 | import re
3 | """Text processing functions"""
4 | from typing import Generator, Optional, Dict
5 | from selenium.webdriver.remote.webdriver import WebDriver
6 | from kwaiagents.config import Config
7 | from kwaiagents.llms import create_chat_completion
8 |
9 |
10 | def split_sentences(text, lang='en'):
11 | if not text:
12 | return []
13 | if lang == 'en':
14 | # Split English sentences using regular expression
15 | sentences = re.split(r'(? Generator[str, None, None]:
29 | """Split text into chunks of a maximum length
30 |
31 | Args:
32 | text (str): The text to split
33 | max_length (int, optional): The maximum length of each chunk. Defaults to 8192.
34 |
35 | Yields:
36 | str: The next chunk of text
37 |
38 | Raises:
39 | ValueError: If the text is longer than the maximum length
40 | """
41 | paragraphs = text.split("\n")
42 | current_length = 0
43 | current_chunk = []
44 |
45 | for paragraph in paragraphs:
46 | if current_length + len(paragraph) + 1 <= max_length:
47 | current_chunk.append(paragraph)
48 | current_length += len(paragraph) + 1
49 | else:
50 | yield "\n".join(current_chunk)
51 | current_chunk = [paragraph]
52 | current_length = len(paragraph) + 1
53 |
54 | if current_chunk:
55 | yield "\n".join(current_chunk)
56 |
57 |
def summarize_text(
    url: str, text: str, question: str, driver: Optional[WebDriver] = None, cfg: Config = None
) -> tuple:
    """Summarize text chunk-by-chunk with the configured fast LLM.

    Args:
        url (str): The url the text came from (kept for interface
            compatibility; not used in the current implementation).
        text (str): The text to summarize.
        question (str): The question the summary should try to answer.
        driver (WebDriver): Optional webdriver used to scroll the page
            in sync with reading progress.
        cfg (Config): Global agent config supplying the chunk size, the
            model name, token limits and the chain logger.

    Returns:
        tuple: ``(summary, prompt_responses)`` — the final summary string
        and the list of (prompt, response) pairs produced along the way.
        (The original ``-> str`` annotation was wrong: every return path
        yields a 2-tuple.)
    """
    if not text:
        return "Error: No text to summarize", []

    text_length = len(text)
    cfg.chain_logger.put("reading", f"共 {text_length} 字需要阅读")

    summaries = []
    chunks = list(split_text(text, cfg.browse_chunk_max_length))
    scroll_ratio = 1 / len(chunks)

    prompt_responses = list()

    if cfg.fast_llm_model in ["llama"] and len(chunks) > 1:
        # Batched path: this backend accepts a list of prompts per call.
        batch_size = 3
        cnt = 0
        for i in range(len(chunks) // batch_size + 1):
            if driver:
                scroll_to_percentage(driver, scroll_ratio * i)
            batch_chunk = chunks[i * batch_size: (i + 1) * batch_size]
            if not batch_chunk:
                break
            batch = [
                create_message(chunk, question)
                for chunk in batch_chunk
            ]
            batch_summaries, _ = create_chat_completion(
                query=batch,
                llm_model_name=cfg.fast_llm_model,
                max_tokens=cfg.browse_summary_max_token,
            )
            # Some backends return the batch as a JSON-encoded string.
            if isinstance(batch_summaries, str):
                batch_summaries = json.loads(batch_summaries)
            summaries.extend(batch_summaries)

            cnt += len(batch)
            cfg.chain_logger.put("reading", f"{cnt} / {len(chunks)} 个段落")
    else:
        # Sequential path: one LLM call per chunk.
        for i, chunk in enumerate(chunks):
            if driver:
                scroll_to_percentage(driver, scroll_ratio * i)

            cfg.chain_logger.put("reading", f"第 {i + 1} / {len(chunks)} 个段落")
            message = create_message(chunk, question)

            try:
                summary, _ = create_chat_completion(
                    query=message,
                    llm_model_name=cfg.fast_llm_model,
                    max_tokens=cfg.browse_summary_max_token,
                )
            except Exception:
                # Best-effort: a failed chunk contributes an empty summary
                # instead of aborting the whole read. (Was a bare `except:`,
                # which also swallowed KeyboardInterrupt/SystemExit.)
                summary = ""
            summaries.append(summary)

            prompt_responses.append((message, summary))

    if len(summaries) == 1:
        # `summaries[0]` rather than the loop variable `summary`, which is
        # unbound when the batched branch ran.
        return summaries[0], prompt_responses
    if len(summaries) == 0:
        return "", prompt_responses
    cfg.chain_logger.put("reading", f"总结这 {len(chunks)} 个段落")

    # Merge the per-chunk summaries with one final LLM pass.
    combined_summary = "\n".join(summaries)
    message = create_message(combined_summary, question)

    summary, _ = create_chat_completion(
        query=message,
        llm_model_name=cfg.fast_llm_model,
        max_tokens=cfg.browse_summary_max_token,
    )
    prompt_responses.append((message, summary))

    return summary, prompt_responses
158 |
159 |
def scroll_to_percentage(driver: WebDriver, ratio: float) -> None:
    """Scroll the page to a fraction of its total height.

    Args:
        driver (WebDriver): The webdriver controlling the page.
        ratio (float): Target position as a fraction of the full page
            height, in [0, 1].

    Raises:
        ValueError: If the ratio is not between 0 and 1.
    """
    if ratio < 0 or ratio > 1:
        raise ValueError("Percentage should be between 0 and 1")
    script = f"window.scrollTo(0, document.body.scrollHeight * {ratio});"
    driver.execute_script(script)
173 |
174 |
def create_message(chunk: str, question: str) -> str:
    """Build the summarization prompt for one chunk of text.

    Args:
        chunk (str): The chunk of text to summarize.
        question (str): The question to answer.

    Returns:
        str: A prompt asking the model to answer the question from the
        chunk, or to summarize the chunk if the question is unanswerable.
        (The original ``Dict[str, str]`` annotation was wrong — the
        function has always returned a plain string.)
    """
    return f'"""{chunk}""" 基于上述文本回答下面的问题 ' +\
        f'问题: "{question}" -- 假如无法回答这个问题,则总结上述文本:'
187 |
188 |
if __name__ == "__main__":
    # Demo: sentence splitting for English and Chinese sample texts.
    samples = {
        'en': "This is an example sentence. Here's another one! And a third?",
        'zh': "这是一个示例句子。这是另一个!还有第三个?",
    }
    for sample_lang, sample_text in samples.items():
        print(split_sentences(sample_text, lang=sample_lang))
--------------------------------------------------------------------------------
/kwaiagents/utils/selenium_utils.py:
--------------------------------------------------------------------------------
1 | import os
2 |
3 | from selenium import webdriver
4 | from selenium.webdriver.remote.webdriver import WebDriver
5 | from selenium.webdriver.common.by import By
6 | from selenium.webdriver.support.wait import WebDriverWait
7 | from selenium.webdriver.support import expected_conditions as EC
8 | from selenium.webdriver.chrome.options import Options as ChromeOptions
9 | from selenium.webdriver.firefox.options import Options as FirefoxOptions
10 | from selenium.webdriver.safari.options import Options as SafariOptions
11 | from webdriver_manager.chrome import ChromeDriverManager
12 | from webdriver_manager.firefox import GeckoDriverManager
13 | import logging
14 |
15 | import time
16 |
17 |
def get_web_driver(selenium_web_browser):
    """Create a selenium WebDriver for the requested browser.

    Args:
        selenium_web_browser (str): One of "chrome", "safari", "firefox";
            any other value raises KeyError.

    Returns:
        WebDriver: A ready-to-use driver instance.
    """
    browser_options = {
        "chrome": ChromeOptions,
        "safari": SafariOptions,
        "firefox": FirefoxOptions,
    }[selenium_web_browser]()

    # Present a desktop Chrome UA regardless of the actual browser.
    browser_options.add_argument(
        "user-agent=Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/112.0.5615.49 Safari/537.36"
    )

    if selenium_web_browser == "firefox":
        return webdriver.Firefox(
            executable_path=GeckoDriverManager().install(), options=browser_options
        )

    if selenium_web_browser == "safari":
        # Requires a bit more setup on the users end
        # See https://developer.apple.com/documentation/webkit/testing_with_webdriver_in_safari
        return webdriver.Safari(options=browser_options)

    # Default: headless Chrome, hardened for containerized environments.
    browser_options.add_argument('--no-sandbox')
    browser_options.add_argument('--disable-dev-shm-usage')
    browser_options.add_argument('--headless')
    proxy = os.getenv("http_proxy")
    if proxy:
        browser_options.add_argument(f'--proxy-server={proxy}')
    return webdriver.Chrome(options=browser_options)
47 |
48 |
def get_pagesource_with_selenium(url: str, selenium_web_browser: str, driver: WebDriver = None) -> tuple:
    """Load *url* in a browser and return its body HTML.

    Args:
        url (str): The page to load.
        selenium_web_browser (str): Browser name passed to get_web_driver.
        driver (WebDriver): Optional existing driver to reuse; a fresh one
            is created when None.

    Returns:
        tuple: ``(driver, page_source)`` — the driver actually used (so
        callers can reuse it, e.g. for scrolling) and the body's outer
        HTML. (The original ``-> str`` annotation was wrong.)
    """
    logging.getLogger("selenium").setLevel(logging.CRITICAL)
    # Bug fix: the old code created a new driver unconditionally, which made
    # the None-check dead code and silently discarded any driver passed in.
    if driver is None:
        driver = get_web_driver(selenium_web_browser)

    driver.get(url)

    # Wait until the <body> element exists so the DOM is ready to read.
    WebDriverWait(driver, 10).until(
        EC.presence_of_element_located((By.TAG_NAME, "body"))
    )

    # Get the HTML content directly from the browser's DOM
    page_source = driver.execute_script("return document.body.outerHTML;")
    return driver, page_source
--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
1 | bs4
2 | pandas
3 | docstring_parser
4 | lunar_python==1.3.2
5 | duckduckgo-search>=4.2
6 | selenium==4.1.4
7 | webdriver-manager==3.8.6
8 | openai==0.27.8
9 | translate==3.6.1
10 | ephem==4.1.4
11 | transformers>=4.33.2
12 | tiktoken
13 |
--------------------------------------------------------------------------------
/setup.py:
--------------------------------------------------------------------------------
#!/usr/bin/env python
"""Packaging script for kwaiagents."""
from setuptools import setup, find_packages


# Long description and dependency list are read from the repo's own files
# so they stay in sync with the README and requirements.txt.
with open('README.md', encoding='utf-8') as f:
    readme = f.read()

with open('requirements.txt', encoding='utf-8') as f:
    requirements = f.read()

setup(
    # Metadata
    name='kwaiagents',
    version='0.0.1',
    # Bug fix: the previous value '>=2.7,>=3.6' is an AND of both
    # specifiers (comma-separated clauses all apply), so the '>=2.7'
    # part was redundant and misleadingly suggested Python 2 support.
    # The codebase uses f-strings, so 3.6 is the real floor.
    python_requires='>=3.6',
    author='Haojie Pan',
    author_email='panhaojie@kuaishou.com',
    description='Kwaiagents',
    long_description=readme,
    long_description_content_type='text/markdown',
    entry_points={
        'console_scripts': [
            'kagentsys=kwaiagents.agent_start:main']
    },
    packages=find_packages(),
    license='Attribution-NonCommercial-ShareAlike 4.0',

    # Package info
    install_requires=requirements,
)
--------------------------------------------------------------------------------