\n", 1040 | " | inputs.question | \n", 1041 | "outputs.response | \n", 1042 | "error | \n", 1043 | "reference.response | \n", 1044 | "feedback.final_answer_correct | \n", 1045 | "execution_time | \n", 1046 | "example_id | \n", 1047 | "id | \n", 1048 | "
---|---|---|---|---|---|---|---|---|
0 | \n", 1053 | "I want a full refund for invoice 237 | \n", 1054 | "You have been refunded a total of: $0.99. Is t... | \n", 1055 | "None | \n", 1056 | "You have been refunded $0.99. | \n", 1057 | "True | \n", 1058 | "3.750356 | \n", 1059 | "b094b32b-94f6-49a4-9af7-a7ccb289cba5 | \n", 1060 | "2ab8e132-e3b0-4ffe-ba73-3d42aea64fda | \n", 1061 | "
1 | \n", 1064 | "My name is Aaron Mitchell and I'd like a refun... | \n", 1065 | "We did not find any purchases associated with ... | \n", 1066 | "None | \n", 1067 | "Which of the following purchases would you lik... | \n", 1068 | "False | \n", 1069 | "3.748979 | \n", 1070 | "2274dab9-5682-4e35-8f30-e3171886b2a9 | \n", 1071 | "c9d3bb87-0ec2-4557-b384-cbf038e18149 | \n", 1072 | "
2 | \n", 1075 | "My name is Aaron Mitchell and I'd like a refund. | \n", 1076 | "Please provide your phone number and either th... | \n", 1077 | "None | \n", 1078 | "I need some more information to help you with ... | \n", 1079 | "True | \n", 1080 | "3.108677 | \n", 1081 | "16e7f941-7c18-4152-82fe-639ce4feca0e | \n", 1082 | "35d9a6f6-dbb7-445f-a214-a12af1d495b0 | \n", 1083 | "
3 | \n", 1086 | "How many songs do you have by James Brown | \n", 1087 | "There are 20 James Brown songs in the database... | \n", 1088 | "None | \n", 1089 | "We have 20 songs by James Brown | \n", 1090 | "True | \n", 1091 | "6.446163 | \n", 1092 | "5a516727-b97f-40ea-a363-605a8b92669a | \n", 1093 | "21d7d353-accd-43f0-9776-56cffb8a3954 | \n", 1094 | "
4 | \n", 1097 | "Who recorded Wish You Were Here again? | \n", 1098 | "I apologize, but I'm not finding \"Wish You Wer... | \n", 1099 | "None | \n", 1100 | "Wish You Were Here is an album by Pink Floyd | \n", 1101 | "False | \n", 1102 | "10.356575 | \n", 1103 | "27e113d9-498f-49ab-a66b-8395a4a6b32b | \n", 1104 | "c476f0a7-b2f5-4628-8e59-c6eb2a4acf4d | \n", 1105 | "
\n", 1304 | " | inputs.messages | \n", 1305 | "outputs.route | \n", 1306 | "error | \n", 1307 | "reference.route | \n", 1308 | "feedback.correct | \n", 1309 | "execution_time | \n", 1310 | "example_id | \n", 1311 | "id | \n", 1312 | "
---|---|---|---|---|---|---|---|---|
0 | \n", 1317 | "[{'role': 'user', 'content': 'Can I get my mon... | \n", 1318 | "refund_agent | \n", 1319 | "None | \n", 1320 | "refund_agent | \n", 1321 | "True | \n", 1322 | "0.634425 | \n", 1323 | "47bb4665-da6f-4b58-a314-fefc886040c3 | \n", 1324 | "f6ccda12-147a-41ad-8e3c-93da544b6ca5 | \n", 1325 | "
1 | \n", 1328 | "[{'role': 'user', 'content': 'i purchased a co... | \n", 1329 | "question_answering_agent | \n", 1330 | "None | \n", 1331 | "question_answering_agent | \n", 1332 | "True | \n", 1333 | "0.412655 | \n", 1334 | "e88b4749-4b72-42d0-9efd-e69ff276b4e2 | \n", 1335 | "47fb6f5c-0d54-4757-b3df-ba2d271d1cf3 | \n", 1336 | "
2 | \n", 1339 | "[{'role': 'user', 'content': 'i want a refund ... | \n", 1340 | "question_answering_agent | \n", 1341 | "None | \n", 1342 | "question_answering_agent | \n", 1343 | "True | \n", 1344 | "0.409138 | \n", 1345 | "0dc9df85-806c-477c-ba2e-b1872b445db9 | \n", 1346 | "aacd798d-9afb-4b84-ab67-e2ec1c3adb22 | \n", 1347 | "
3 | \n", 1350 | "[{'role': 'user', 'content': 'I was thinking o... | \n", 1351 | "question_answering_agent | \n", 1352 | "None | \n", 1353 | "question_answering_agent | \n", 1354 | "True | \n", 1355 | "0.410535 | \n", 1356 | "cd503c74-547a-41fb-8763-ed808dcf9ba9 | \n", 1357 | "7770076c-0894-460f-a7ec-ed53ae491cf4 | \n", 1358 | "
4 | \n", 1361 | "[{'role': 'user', 'content': 'i bought some tr... | \n", 1362 | "refund_agent | \n", 1363 | "None | \n", 1364 | "refund_agent | \n", 1365 | "True | \n", 1366 | "0.342001 | \n", 1367 | "ac23df0a-f0d7-442f-b85d-26e62126adce | \n", 1368 | "b227ce5d-5378-4195-ab76-3d52f1db1b2a | \n", 1369 | "
\n", 1619 | " | inputs.question | \n", 1620 | "outputs.trajectory | \n", 1621 | "error | \n", 1622 | "reference.trajectory | \n", 1623 | "feedback.extra_steps | \n", 1624 | "feedback.unmatched_steps | \n", 1625 | "execution_time | \n", 1626 | "example_id | \n", 1627 | "id | \n", 1628 | "
---|---|---|---|---|---|---|---|---|---|
0 | \n", 1633 | "My name is Aaron Mitchell and I'd like a refund. | \n", 1634 | "[intent_classifier, refund_agent, gather_info,... | \n", 1635 | "None | \n", 1636 | "[intent_classifier, refund_agent, gather_info,... | \n", 1637 | "0 | \n", 1638 | "0 | \n", 1639 | "2.993548 | \n", 1640 | "0f9e2190-ef0f-455e-86e1-f3965fe2dd20 | \n", 1641 | "70f63270-7d0e-49f4-9e25-873ce8725324 | \n", 1642 | "
1 | \n", 1645 | "My name is Aaron Mitchell. My number is +1 (20... | \n", 1646 | "[intent_classifier, refund_agent, gather_info,... | \n", 1647 | "None | \n", 1648 | "[intent_classifier, refund_agent, gather_info,... | \n", 1649 | "0 | \n", 1650 | "0 | \n", 1651 | "3.585207 | \n", 1652 | "f7573d70-d3c9-4273-bad8-96c1693d41e6 | \n", 1653 | "7e2b5eaf-3af9-475b-978b-c84167d9c3d8 | \n", 1654 | "
2 | \n", 1657 | "My name is Aaron Mitchell and I'd like a refun... | \n", 1658 | "[intent_classifier, refund_agent, gather_info,... | \n", 1659 | "None | \n", 1660 | "[intent_classifier, refund_agent, gather_info,... | \n", 1661 | "0 | \n", 1662 | "0 | \n", 1663 | "3.596975 | \n", 1664 | "6c35522a-a1ca-4212-9edf-5c17566cfb05 | \n", 1665 | "a748f4a7-bd7e-40b2-af6e-e9de37e56000 | \n", 1666 | "
3 | \n", 1669 | "How many songs do you have by James Brown | \n", 1670 | "[intent_classifier, question_answering_agent, ... | \n", 1671 | "None | \n", 1672 | "[intent_classifier, question_answering_agent, ... | \n", 1673 | "0 | \n", 1674 | "0 | \n", 1675 | "7.249661 | \n", 1676 | "1c308dca-8a5e-44d8-9620-d71c36a06852 | \n", 1677 | "45055ce2-bb55-475c-918f-3e69aaaecc40 | \n", 1678 | "
4 | \n", 1681 | "Who recorded Wish You Were Here again? What ot... | \n", 1682 | "[intent_classifier, question_answering_agent, ... | \n", 1683 | "None | \n", 1684 | "[intent_classifier, question_answering_agent, ... | \n", 1685 | "3 | \n", 1686 | "3 | \n", 1687 | "19.679824 | \n", 1688 | "14b71f30-6e70-4ea4-b527-3fdca46de008 | \n", 1689 | "b416ff67-b582-402b-9161-3503f9bc5d87 | \n", 1690 | "