{"id":1795,"date":"2024-04-03T01:50:47","date_gmt":"2024-04-02T17:50:47","guid":{"rendered":"https:\/\/www.tchepai.com\/?p=1795"},"modified":"2024-08-18T09:00:12","modified_gmt":"2024-08-18T01:00:12","slug":"react","status":"publish","type":"post","link":"https:\/\/www.kdjingpai.com\/ja\/react\/","title":{"rendered":"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c"},"content":{"rendered":"<p>\u539f\u6587\uff1ahttps:\/\/arxiv.org\/pdf\/2210.03629.pdf<\/p>\n<p>\u770b\u5b8c\u4e5f\u65e0\u6cd5\u7406\u89e3ReAct\u5982\u4f55\u8fd0\u4f5c\u548c\u5e94\u7528\uff1f\u8bf7\u770b\u300a<a href=\"https:\/\/www.kdjingpai.com\/react-2\/\">ReAct\u5b9e\u73b0\u903b\u8f91\u5b9e\u64cd<\/a>\u300b\uff0c\u7528\u5b9e\u9645\u6848\u4f8b\u8fdb\u884c\u8bb2\u89e3\u3002<\/p>\n<p>&nbsp;<\/p>\n<h2>\u6458\u8981<\/h2>\n<p>&nbsp;<\/p>\n<p>\u867d\u7136\u5927\u578b\u8bed\u8a00\u6a21\u578b(llm)\u5728\u8bed\u8a00\u7406\u89e3\u548c\u4ea4\u4e92\u5f0f\u51b3\u7b56\u7684\u4efb\u52a1\u4e2d\u8868\u73b0\u51fa\u4ee4\u4eba\u5370\u8c61\u6df1\u523b\u7684\u6027\u80fd\uff0c\u4f46\u5b83\u4eec\u7684\u63a8\u7406\u80fd\u529b(\u5982\u601d\u7ef4\u94fe\u63d0\u793a)\u548c\u884c\u52a8\u80fd\u529b(\u5982\u884c\u52a8\u8ba1\u5212\u751f\u6210)\u4e3b\u8981\u662f\u4f5c\u4e3a\u5355\u72ec\u7684\u4e3b\u9898\u8fdb\u884c\u7814\u7a76\u3002\u672c\u6587\u63a2\u7d22\u4e86\u4f7f\u7528llm\u4ee5\u4ea4\u9519\u7684\u65b9\u5f0f\u751f\u6210\u63a8\u7406\u8f68\u8ff9\u548c\u7279\u5b9a\u4efb\u52a1\u7684\u884c\u52a8\uff0c\u5141\u8bb8\u4e24\u8005\u4e4b\u95f4\u4ea7\u751f\u66f4\u5927\u7684\u534f\u540c\u4f5c\u7528:\u63a8\u7406\u8f68\u8ff9\u5e2e\u52a9\u6a21\u578b\u5f52\u7eb3\u3001\u8ddf\u8e2a\u548c\u66f4\u65b0\u884c\u52a8\u8ba1\u5212\uff0c\u4ee5\u53ca\u5904\u7406\u5f02\u5e38\uff0c\u800c\u884c\u52a8\u5141\u8bb8\u5b83\u4e0e\u5916\u90e8\u6765\u6e90(\u5982\u77e5\u8bc6\u5e93\u6216\u73af\u5883)\u4ea4\u4e92\u5e76\u6536\u96c6\u989d\u5916\u7684\u4fe1\u606f\u3002\u5c06\u6240\u63d0\u51fa\u65b9\u6cd5ReAct\u5e94\u7528\u4e8e\u4
e00\u7ec4\u4e0d\u540c\u7684\u8bed\u8a00\u548c\u51b3\u7b56\u4efb\u52a1\uff0c\u5e76\u5728\u6700\u5148\u8fdb\u7684\u57fa\u7ebf\u4e0a\u8bc1\u660e\u4e86\u5176\u6709\u6548\u6027\uff0c\u6b64\u5916\u8fd8\u63d0\u9ad8\u4e86\u4eba\u7c7b\u7684\u53ef\u89e3\u91ca\u6027\u548c\u53ef\u4fe1\u6027\u3002\u5177\u4f53\u800c\u8a00\uff0c\u5728\u95ee\u9898\u56de\u7b54(HotpotQA)\u548c\u4e8b\u5b9e\u9a8c\u8bc1(Fever)\u4e2d\uff0cReAct\u901a\u8fc7\u4e0e\u7b80\u5355\u7684\u7ef4\u57fa\u767e\u79d1API\u4ea4\u4e92\uff0c\u514b\u670d\u4e86\u601d\u7ef4\u94fe\u63a8\u7406\u4e2d\u666e\u904d\u5b58\u5728\u7684\u5e7b\u89c9\u548c\u9519\u8bef\u4f20\u64ad\u95ee\u9898\uff0c\u5e76\u751f\u6210\u7c7b\u4f3c\u4eba\u7c7b\u7684\u4efb\u52a1\u89e3\u51b3\u8f68\u8ff9\uff0c\u8fd9\u4e9b\u8f68\u8ff9\u6bd4\u6ca1\u6709\u63a8\u7406\u8f68\u8ff9\u7684\u57fa\u7ebf\u66f4\u5bb9\u6613\u89e3\u91ca\u3002\u6b64\u5916\uff0c\u5728\u4e24\u4e2a\u4ea4\u4e92\u5f0f\u51b3\u7b56\u57fa\u51c6(ALFWorld\u548cWebShop)\u4e0a\uff0cReAct\u7684\u7edd\u5bf9\u6210\u529f\u7387\u6bd4\u6a21\u4eff\u548c\u5f3a\u5316\u5b66\u4e60\u65b9\u6cd5\u5206\u522b\u9ad8\u51fa34\uff05\u548c10\uff05\uff0c\u800c\u53ea\u9700\u8981\u4e00\u4e2a\u6216\u4e24\u4e2a\u4e0a\u4e0b\u6587\u793a\u4f8b\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>&nbsp;<\/p>\n<h2>1 
\u5f15\u8a00<\/h2>\n<p>&nbsp;<\/p>\n<p>\u4eba\u7c7b\u667a\u80fd\u7684\u4e00\u4e2a\u72ec\u7279\u7279\u6027\u662f\u80fd\u591f\u65e0\u7f1d\u5730\u5c06\u9762\u5411\u4efb\u52a1\u7684\u884c\u52a8\u4e0e\u8a00\u8bed\u63a8\u7406\u7ed3\u5408\u8d77\u6765\uff0c\u8fd9\u88ab\u8ba4\u4e3a\u5728\u4eba\u7c7b\u8ba4\u77e5\u4e2d\u626e\u6f14\u7740\u91cd\u8981\u89d2\u8272\uff0c\u6709\u52a9\u4e8e\u81ea\u6211\u8c03\u8282\u6216\u7b56\u7565\u5236\u5b9a\u4ee5\u53ca\u7ef4\u6301\u5de5\u4f5c\u8bb0\u5fc6\u3002\u4ee5\u5728\u53a8\u623f\u91cc\u70f9\u996a\u4e00\u9053\u83dc\u4e3a\u4f8b\uff0c\u5728\u4e24\u4e2a\u5177\u4f53\u52a8\u4f5c\u4e4b\u95f4\uff0c\u6211\u4eec\u53ef\u80fd\u4f1a\u7528\u8bed\u8a00\u6765\u63a8\u7406\u4ee5\u8ddf\u8e2a\u8fdb\u5ea6\uff08\u201c\u73b0\u5728\u6240\u6709\u4e1c\u897f\u90fd\u5207\u597d\u4e86\uff0c\u6211\u5e94\u8be5\u628a\u6c34\u9505\u52a0\u70ed\u201d\uff09\uff0c\u5904\u7406\u5f02\u5e38\u6216\u6839\u636e\u60c5\u51b5\u8c03\u6574\u8ba1\u5212\uff08\u201c\u6211\u6ca1\u6709\u76d0\uff0c\u90a3\u4e48\u8ba9\u6211\u7528\u9171\u6cb9\u548c\u80e1\u6912\u4ee3\u66ff\u201d\uff09\uff0c\u4ee5\u53ca\u610f\u8bc6\u5230\u4f55\u65f6\u9700\u8981\u5916\u90e8\u4fe1\u606f\uff08\u201c\u6211\u8be5\u5982\u4f55\u51c6\u5907\u9762\u56e2\uff1f\u8ba9\u6211\u4e0a\u7f51\u641c\u7d22\u4e00\u4e0b\u201d\uff09\u3002\u6211\u4eec\u4e5f\u53ef\u80fd\u91c7\u53d6\u884c\u52a8\uff08\u6253\u5f00\u98df\u8c31\u4e66\u9605\u8bfb\u98df\u8c31\uff0c\u6253\u5f00\u51b0\u7bb1\uff0c\u68c0\u67e5\u98df\u6750\uff09\u6765\u652f\u6301\u63a8\u7406\u548c\u56de\u7b54\u95ee\u9898\uff08\u201c\u6211\u73b0\u5728\u80fd\u505a\u4ec0\u4e48\u83dc\uff1f\u201d\uff09\u3002\u8fd9\u79cd\u201c\u884c\u52a8\u201d\u4e0e\u201c\u63a8\u7406\u201d\u4e4b\u95f4\u7684\u7d27\u5bc6\u534f\u540c\u4f5c\u7528\uff0c\u4f7f\u4eba\u7c7b\u80fd\u591f\u5feb\u901f\u5b66\u4e60\u65b0\u4efb\u52a1\uff0c\u5e76\u5728\u4e4b\u524d\u672a\u9047\u5230\u7684\u73af\u5883\u6216\u9762\u5bf9\u4fe1\u606f\u4e0d\u786e\u5b9a\u6027\u65f6\uff0c\u8fdb\u884c\u7a33\u5065\u7684\u51b3\u7b56\u6216\u63a8\u7406\u300
2<\/p>\n<p>&nbsp;<\/p>\n<p>\u6700\u8fd1\u7684\u6210\u679c\u5df2\u7ecf\u6697\u793a\u4e86\u5c06\u8a00\u8bed\u63a8\u7406\u4e0e\u81ea\u4e3b\u7cfb\u7edf\u7684\u4ea4\u4e92\u5f0f\u51b3\u7b56\u5236\u5b9a\u7ed3\u5408\u8d77\u6765\u7684\u53ef\u80fd\u6027\u3002\u4e00\u65b9\u9762\uff0c\u9002\u5f53\u5f15\u5bfc\u7684\u5927\u578b\u8bed\u8a00\u6a21\u578b\uff08LLMs\uff09\u5df2\u7ecf\u5c55\u73b0\u51fa\u5728\u7b97\u672f\u3001\u5e38\u8bc6\u548c\u7b26\u53f7\u63a8\u7406\u4efb\u52a1\u4e2d\u8fdb\u884c\u51e0\u6b65\u63a8\u7406\u7684\u80fd\u529b\u3002\u7136\u800c\uff0c\u8fd9\u79cd\u201c\u601d\u7ef4\u94fe\u201d\u63a8\u7406\u662f\u4e00\u4e2a\u9759\u6001\u7684\u9ed1\u7bb1\uff0c\u6a21\u578b\u4f7f\u7528\u5176\u5185\u90e8\u8868\u793a\u6765\u751f\u6210\u601d\u8003\uff0c\u5e76\u4e14\u4e0d\u57fa\u4e8e\u5916\u90e8\u4e16\u754c\uff0c\u8fd9\u9650\u5236\u4e86\u5176\u53cd\u5e94\u6027\u63a8\u7406\u6216\u66f4\u65b0\u77e5\u8bc6\u7684\u80fd\u529b\u3002\u8fd9\u53ef\u80fd\u5bfc\u81f4\u4e8b\u5b9e\u5e7b\u89c9\u548c\u63a8\u7406\u8fc7\u7a0b\u4e2d\u7684\u9519\u8bef\u4f20\u64ad\uff08\u56fe1\uff081b\uff09\uff09\u3002\u53e6\u4e00\u65b9\u9762\uff0c\u6700\u8fd1\u7684\u5de5\u4f5c\u63a2\u7d22\u4e86\u5728\u4ea4\u4e92\u5f0f\u73af\u5883\u4e2d\u4f7f\u7528\u9884\u8bad\u7ec3\u8bed\u8a00\u6a21\u578b\u8fdb\u884c\u89c4\u5212\u548c\u884c\u52a8\uff0c\u91cd\u70b9\u662f\u901a\u8fc7\u8bed\u8a00\u5148\u9a8c\u6765\u9884\u6d4b\u884c\u52a8\u3002\u8fd9\u4e9b\u65b9\u6cd5\u901a\u5e38\u5c06\u591a\u6a21\u6001\u89c2\u5bdf\u8f6c\u6362\u4e3a\u6587\u672c\uff0c\u4f7f\u7528\u8bed\u8a00\u6a21\u578b\u751f\u6210\u7279\u5b9a\u9886\u57df\u7684\u884c\u52a8\u6216\u8ba1\u5212\uff0c\u7136\u540e\u4f7f\u7528\u63a7\u5236\u5668\u6765\u9009\u62e9\u6216\u6267\u884c\u5b83\u4eec\u3002\u7136\u800c\uff0c\u5b83\u4eec\u5e76\u4e0d\u4f7f\u7528\u8bed\u8a00\u6a21\u578b\u6765\u62bd\u8c61\u5730\u63a8\u7406\u9ad8\u5c42\u6b21\u76ee\u6807\u6216\u7ef4\u6301\u5de5\u4f5c\u8bb0\u5fc6\u4ee5\u652f\u6301\u884c\u52a8\uff0c\u9664\u4e86Huang et al. 
(2022b)\u8fdb\u884c\u4e86\u6709\u9650\u5f62\u5f0f\u7684\u8a00\u8bed\u63a8\u7406\uff0c\u4ee5\u91cd\u7533\u5f53\u524d\u72b6\u6001\u7684\u7a7a\u95f4\u4e8b\u5b9e\u3002\u9664\u4e86\u8fd9\u79cd\u7b80\u5355\u7684\u5177\u8eab\u4efb\u52a1\u4e0e\u51e0\u4e2a\u79ef\u6728\u4e92\u52a8\u4e4b\u5916\uff0c\u8fd8\u6ca1\u6709\u7814\u7a76\u5982\u4f55\u5c06\u63a8\u7406\u548c\u884c\u52a8\u4ee5\u534f\u540c\u7684\u65b9\u5f0f\u7ed3\u5408\u8d77\u6765\u89e3\u51b3\u4e00\u822c\u4efb\u52a1\uff0c\u4ee5\u53ca\u8fd9\u79cd\u7ed3\u5408\u76f8\u6bd4\u5355\u72ec\u63a8\u7406\u6216\u884c\u52a8\u662f\u5426\u80fd\u591f\u5e26\u6765\u7cfb\u7edf\u6027\u7684\u597d\u5904\u3002<\/p>\n<p>&nbsp;<\/p>\n<p><img loading=\"lazy\" decoding=\"async\" class=\"aligncenter size-full wp-image-2529\" title=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-1\" src=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/a1a912c45429c0c.png\" alt=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-1\" width=\"987\" height=\"814\" srcset=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/a1a912c45429c0c.png 987w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/a1a912c45429c0c-300x247.png 300w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/a1a912c45429c0c-768x633.png 768w\" sizes=\"auto, (max-width: 987px) 100vw, 987px\" \/><\/p>\n<p>\u56fe 1\uff1a(1) \u6bd4\u8f83\u4e864\u79cd\u63d0\u793a\u65b9\u6cd5\uff0c(a) \u6807\u51c6\u63d0\u793a\uff0c(b) \u601d\u7ef4\u94fe\uff08CoT\uff0c\u4ec5\u63a8\u7406\uff09\uff0c(c) \u4ec5\u884c\u52a8\uff0c\u4ee5\u53ca (d) ReAct\uff08\u63a8\u7406+\u884c\u52a8\uff09\uff0c\u89e3\u51b3\u4e00\u4e2aHotpotQA\uff08Yang\u7b49\u4eba\uff0c2018\u5e74\uff09\u95ee\u9898\u3002(2) \u6bd4\u8f83\u4e86 (a) \u4ec5\u884c\u52a8\u548c (b) 
ReAct\u63d0\u793a\u65b9\u6cd5\u89e3\u51b3\u4e00\u4e2aAlfWorld\uff08Shridhar\u7b49\u4eba\uff0c2020b\uff09\u6e38\u620f\u3002\u5728\u8fd9\u4e24\u4e2a\u9886\u57df\u4e2d\uff0c\u6211\u4eec\u5728\u63d0\u793a\u4e2d\u7701\u7565\u4e86\u4e0a\u4e0b\u6587\u793a\u4f8b\uff0c\u4ec5\u5c55\u793a\u4e86\u7531\u6a21\u578b\uff08\u884c\u52a8\uff0c\u601d\u8003\uff09\u548c\u73af\u5883\uff08\u89c2\u5bdf\uff09\u751f\u6210\u7684\u95ee\u9898\u89e3\u51b3\u8f68\u8ff9\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>\u672c\u6587\u63d0\u51fa<sub>ReAct<\/sub>\uff0c\u4e00\u79cd\u5c06\u63a8\u7406\u548c\u884c\u52a8\u4e0e\u8bed\u8a00\u6a21\u578b\u76f8\u7ed3\u5408\u7684\u901a\u7528\u8303\u5f0f\uff0c\u4ee5\u89e3\u51b3\u5404\u79cd\u8bed\u8a00\u63a8\u7406\u548c\u51b3\u7b56\u4efb\u52a1(\u56fe1)\u3002ReAct\u63d0\u793allm\u4ee5\u4ea4\u53c9\u7684\u65b9\u5f0f\u751f\u6210\u4e0e\u4efb\u52a1\u76f8\u5173\u7684\u53e3\u5934\u63a8\u7406\u75d5\u8ff9\u548c\u884c\u52a8\uff0c\u8fd9\u5141\u8bb8\u6a21\u578b\u6267\u884c\u52a8\u6001\u63a8\u7406\u4ee5\u521b\u5efa\u3001\u7ef4\u62a4\u548c\u8c03\u6574\u884c\u52a8\u7684\u9ad8\u7ea7\u8ba1\u5212(\u7406\u7531\u884c\u52a8)\uff0c\u540c\u65f6\u4e0e\u5916\u90e8\u73af\u5883(\u4f8b\u5982\uff1a\u7ef4\u57fa\u767e\u79d1)\u4ea4\u4e92\uff0c\u5c06\u989d\u5916\u7684\u4fe1\u606f\u7eb3\u5165\u63a8\u7406(\u884c\u52a8\u63a8\u7406)\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>\u672c\u6587\u5728\u56db\u4e2a\u4e0d\u540c\u7684\u57fa\u51c6\u4e0a\u5bf9ReAct\u548c\u6700\u5148\u8fdb\u7684\u57fa\u7ebf\u8fdb\u884c\u4e86\u5b9e\u8bc1\u8bc4\u4f30:\u95ee\u7b54\u3001\u4e8b\u5b9e\u9a8c\u8bc1\u3001\u6587\u672c\u6e38\u620f\u548c\u7f51\u9875\u5bfc\u822a\u3002\u5bf9\u4e8eHotPotQA\u548cFever\uff0c\u901a\u8fc7\u8bbf\u95ee\u6a21\u578b\u53ef\u4ee5\u4ea4\u4e92\u7684\u7ef4\u57fa\u767e\u79d1API, ReAct\u4f18\u4e8e\u666e\u901a\u7684\u52a8\u4f5c\u751f\u6210\u6a21\u578b\uff0c\u540c\u65f6\u4e0e\u601d\u7ef4\u94fe\u63a8\u7406(CoT) 
\u7ade\u4e89\u3002\u603b\u7684\u6765\u8bf4\uff0c\u6700\u597d\u7684\u65b9\u6cd5\u662fReAct\u548cCoT\u7684\u7ed3\u5408\uff0c\u8fd9\u5141\u8bb8\u5728\u63a8\u7406\u8fc7\u7a0b\u4e2d\u4f7f\u7528\u5185\u90e8\u77e5\u8bc6\u548c\u5916\u90e8\u83b7\u5f97\u7684\u4fe1\u606f\u3002\u5728ALFWorld\u548cWebShop\u4e0a\uff0c\u4e24\u6b21\u751a\u81f3\u4e00\u6b21ReAct\u63d0\u793a\u80fd\u591f\u80dc\u8fc7\u752810<sup>3 <\/sup>\u223c 10<sup>5<\/sup>\u4efb\u52a1\u5b9e\u4f8b\u8bad\u7ec3\u7684\u6a21\u4eff\u6216\u5f3a\u5316\u5b66\u4e60\u65b9\u6cd5\uff0c\u6210\u529f\u7387\u5206\u522b\u7edd\u5bf9\u63d0\u9ad834\uff05\u548c10\uff05\u3002\u901a\u8fc7\u663e\u793a\u51fa\u6bd4\u53ea\u91c7\u53d6\u884c\u52a8\u7684\u53d7\u63a7\u57fa\u7ebf\u7684\u4e00\u81f4\u4f18\u52bf\uff0c\u8bc1\u660e\u4e86\u7a00\u758f\u7684\u3001\u901a\u7528\u7684\u63a8\u7406\u5728\u51b3\u7b56\u4e2d\u7684\u91cd\u8981\u6027\u3002\u9664\u4e86\u666e\u904d\u9002\u7528\u6027\u548c\u6027\u80fd\u63d0\u5347\u5916\uff0c\u63a8\u7406\u548c\u884c\u52a8\u7684\u7ed3\u5408\u8fd8\u6709\u52a9\u4e8e\u6a21\u578b\u7684\u53ef\u89e3\u91ca\u6027\u3001\u53ef\u4fe1\u6027\u548c\u8de8\u6240\u6709\u9886\u57df\u7684\u53ef\u8bca\u65ad\u6027\uff0c\u56e0\u4e3a\u4eba\u7c7b\u53ef\u4ee5\u5f88\u5bb9\u6613\u5730\u533a\u5206\u6765\u81ea\u6a21\u578b\u5185\u90e8\u77e5\u8bc6\u7684\u4fe1\u606f\u4e0e\u5916\u90e8\u73af\u5883\u7684\u533a\u522b\uff0c\u4ee5\u53ca\u68c0\u67e5\u63a8\u7406\u8f68\u8ff9\u4ee5\u4e86\u89e3\u6a21\u578b\u884c\u52a8\u7684\u51b3\u7b56\u57fa\u7840\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>\u603b\u800c\u8a00\u4e4b\uff0c\u6211\u4eec\u7684\u4e3b\u8981\u8d21\u732e\u5982\u4e0b:<\/p>\n<p>(1)\u63d0\u51faReAct\uff0c\u4e00\u79cd\u65b0\u7684\u57fa\u4e8e\u63d0\u793a\u7684\u8303\u5f0f\uff0c\u5728\u8bed\u8a00\u6a21\u578b\u4e2d\u534f\u540c\u63a8\u7406\u548c\u884c\u52a8\uff0c\u4ee5\u89e3\u51b3\u4e00\u822c\u4efb\u52a1;<\/p>\n<p>(2)\u5728\u4e0d\u540c\u7684\u57fa\u51c6\u4e0a\u8fdb\u884c\u4e86\u5e7f\u6cdb\u7684\u5b9e\u9a8c\uff0c\u4ee5\u5c55\u793aReAct\u5728\u5c11\u6837\u672c\u5b66\u4e60\u8bbe
\u7f6e\u4e2d\u6bd4\u4e4b\u524d\u5355\u72ec\u8fdb\u884c\u63a8\u7406\u6216\u52a8\u4f5c\u751f\u6210\u7684\u65b9\u6cd5\u7684\u4f18\u52bf;<\/p>\n<p>(3)\u63d0\u51fa\u7cfb\u7edf\u6d88\u878d\u548c\u5206\u6790\uff0c\u4ee5\u4e86\u89e3\u884c\u52a8\u5728\u63a8\u7406\u4efb\u52a1\u4e2d\u7684\u91cd\u8981\u6027\uff0c\u4ee5\u53ca\u63a8\u7406\u5728\u4ea4\u4e92\u4efb\u52a1\u4e2d\u7684\u91cd\u8981\u6027;<\/p>\n<p>(4)\u5206\u6790\u4e86ReAct\u5728\u63d0\u793a\u8bbe\u7f6e\u4e0b\u7684\u5c40\u9650\u6027(\u5373\uff1a\u5bf9\u63a8\u7406\u548c\u884c\u4e3a\u7684\u652f\u6301\u6709\u9650)\uff0c\u5e76\u8fdb\u884c\u4e86\u521d\u6b65\u7684\u5fae\u8c03\u5b9e\u9a8c\uff0c\u663e\u793a\u4e86ReAct\u901a\u8fc7\u989d\u5916\u7684\u8bad\u7ec3\u6570\u636e\u8fdb\u884c\u6539\u8fdb\u7684\u6f5c\u529b\u3002\u6269\u5c55ReAct\u4ee5\u8bad\u7ec3\u548c\u64cd\u4f5c\u66f4\u591a\u7684\u4efb\u52a1\uff0c\u5e76\u5c06\u5176\u4e0e\u5f3a\u5316\u5b66\u4e60\u7b49\u4e92\u8865\u8303\u5f0f\u76f8\u7ed3\u5408\uff0c\u53ef\u4ee5\u8fdb\u4e00\u6b65\u91ca\u653e\u5927\u578b\u8bed\u8a00\u6a21\u578b\u7684\u6f5c\u529b\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>&nbsp;<\/p>\n<h2>2 REACT:\u534f\u540c\u63a8\u7406+\u884c\u52a8<\/h2>\n<p>&nbsp;<\/p>\n<p>\u8003\u8651\u4e00\u4e2a\u4e0e\u73af\u5883\u4ea4\u4e92\u4ee5\u89e3\u51b3\u4efb\u52a1\u7684\u667a\u80fd\u4f53\u7684\u4e00\u822c\u8bbe\u7f6e\u3002\u5728\u65f6\u95f4\u6b65\u9aa4<em>t<\/em>\u4e0a\uff0c\u4ee3\u7406\u4ece\u73af\u5883\u4e2d\u63a5\u6536\u5230\u4e00\u4e2a\u89c2\u5bdf\u7ed3\u679c<em>o<sub>t <\/sub><\/em>\u2208 O\uff0c\u5e76\u6839\u636e\u67d0\u4e9b\u7b56\u7565<em>\u03c0<\/em>(<em>a<sub>t<\/sub><\/em>|<em>c<sub>t<\/sub><\/em>)\u91c7\u53d6\u4e00\u4e2a\u64cd\u4f5c<em>a<sub>t <\/sub><\/em>\u2208 A\uff0c\u5176\u4e2d<em>c<sub>t <\/sub><\/em>= (<em>o<\/em><sub>1<\/sub><em>,a<\/em><sub>1<\/sub><em>,<\/em>\u00b7\u00b7\u00b7 <em>,o<sub>t<\/sub><\/em><sub>\u22121<\/sub><em>,a<sub>t<\/sub><\/em><sub>\u22121<\/sub><em>,o<sub>t<\/sub><\/em>)\u662f\u4ee3\u7406\u7684\u4e0a\u4e0b\u6587\u3002\u5f53\u6620\u5c04<em>c<sub>t 
<\/sub><\/em>\u21a6 <em>a<sub>t<\/sub><\/em>\u662f\u9ad8\u5ea6\u9690\u5f0f\u7684\u5e76\u4e14\u9700\u8981\u5927\u91cf\u8ba1\u7b97\u65f6\uff0c\u5b66\u4e60\u7b56\u7565\u662f\u5177\u6709\u6311\u6218\u6027\u7684\u3002\u4f8b\u5982\uff0c\u56fe1 (1c)\u6240\u793a\u7684\u4ee3\u7406\u65e0\u6cd5\u751f\u6210\u6b63\u786e\u7684\u6700\u7ec8\u52a8\u4f5c(Act 4)\u6765\u5b8c\u6210QA\u4efb\u52a1\uff0c\u56e0\u4e3a\u5b83\u9700\u8981\u5bf9\u8f68\u8ff9\u4e0a\u4e0b\u6587(\u95ee\u9898\uff0cAct 1-3, Obs 1-3)\u8fdb\u884c\u590d\u6742\u7684\u63a8\u7406\u3002\u7c7b\u4f3c\u5730\uff0c\u5982\u56fe1 (2a)\u6240\u793a\u7684\u4ee3\u7406\u65e0\u6cd5\u4ece\u4e0a\u4e0b\u6587\u4e2d\u7406\u89e3\u6c34\u69fd1\u4e0d\u5305\u542b\u80e1\u6912\u74f61\uff0c\u56e0\u6b64\u4e0d\u65ad\u4ea7\u751f\u5e7b\u89c9\u884c\u4e3a\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>ReAct\u7684\u60f3\u6cd5\u5f88\u7b80\u5355:\u6211\u4eec\u5c06\u667a\u80fd\u4f53\u7684\u52a8\u4f5c\u7a7a\u95f4\u6269\u5927\u5230\u00c2 = A \u222a L\uff0c\u5176\u4e2dL\u662f\u8bed\u8a00\u7a7a\u95f4\u3002\u8bed\u8a00\u7a7a\u95f4\u4e2d\u7684\u4e00\u4e2a\u52a8\u4f5c<em>\u00e2<sub>t<\/sub><\/em> \u2208 L\uff0c\u6211\u4eec\u5c06\u5176\u79f0\u4e3a\u601d\u60f3\u6216\u63a8\u7406\u75d5\u8ff9\uff0c\u4e0d\u4f1a\u5f71\u54cd\u5916\u90e8\u73af\u5883\uff0c\u56e0\u6b64\u4e0d\u4f1a\u5bfc\u81f4\u89c2\u5bdf\u53cd\u9988\u3002\u76f8\u53cd\uff0c\u4e00\u4e2a\u601d\u60f3<em>\u00e2<sub>t<\/sub><\/em>\u65e8\u5728\u901a\u8fc7\u5bf9\u5f53\u524d\u4e0a\u4e0b\u6587<em>c<sub>t<\/sub><\/em>\u8fdb\u884c\u63a8\u7406\u6765\u7f16\u5199\u6709\u7528\u7684\u4fe1\u606f\uff0c\u5e76\u66f4\u65b0\u4e0a\u4e0b\u6587<em>c<\/em><sub><em>t<\/em>+1<\/sub> = (<em>c<sub>t<\/sub><\/em>, <em>\u00e2<sub>t<\/sub><\/em>)\u4ee5\u652f\u6301\u672a\u6765\u7684\u63a8\u7406\u6216\u884c\u52a8\u3002\u5982\u56fe1\u6240\u793a\uff0c\u53ef\u4ee5\u6709\u5404\u79cd\u7c7b\u578b\u7684\u6709\u7528\u7684\u60f3\u6cd5\uff0c\u4f8b\u5982\uff1a\u5206\u89e3\u4efb\u52a1\u76ee\u6807\u548c\u521b\u5efa\u884c\u52a8\u8ba1\u5212(2b, Act 
1;1d\uff0c\u601d\u60f31)\uff0c\u6ce8\u5165\u4e0e\u4efb\u52a1\u89e3\u51b3\u76f8\u5173\u7684\u5e38\u8bc6\u77e5\u8bc6(2b\uff0c\u601d\u60f31)\uff0c\u4ece\u89c2\u5bdf\u4e2d\u63d0\u53d6\u91cd\u8981\u90e8\u5206(1d\uff0c\u601d\u60f32,4)\uff0c\u8ddf\u8e2a\u8fdb\u5c55\u548c\u8fd0\u8f93\u884c\u52a8\u8ba1\u5212(2b\uff0c\u601d\u60f38)\uff0c\u5904\u7406\u5f02\u5e38\u548c\u8c03\u6574\u884c\u52a8\u8ba1\u5212(1d\uff0c\u601d\u60f33)\uff0c\u7b49\u7b49\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>\u7136\u800c\uff0c\u7531\u4e8e\u8bed\u8a00\u7a7a\u95f4L\u662f\u65e0\u9650\u7684\uff0c\u5728\u8fd9\u4e2a\u589e\u5f3a\u7684\u884c\u52a8\u7a7a\u95f4\u4e2d\u5b66\u4e60\u662f\u56f0\u96be\u7684\uff0c\u9700\u8981\u5f88\u5f3a\u7684\u8bed\u8a00\u5148\u9a8c\u3002\u5728\u672c\u6587\u4e2d\uff0c\u6211\u4eec\u4e3b\u8981\u5173\u6ce8\u5728\u8fd9\u4e2a\u8bbe\u7f6e\u4e2d\uff0c\u4e00\u4e2a\u51bb\u7ed3\u7684\u5927\u578b\u8bed\u8a00\u6a21\u578bPaLM-540B (Chowdhery et al., 2022)<a href=\"#_ftn1\" name=\"_ftnref1\"><sup>[1]<\/sup><\/a>\u7528\u5c11\u6837\u672c\u7684\u4e0a\u4e0b\u6587\u793a\u4f8b\u6765\u63d0\u793a\uff0c\u4ee5\u751f\u6210\u7279\u5b9a\u9886\u57df\u7684\u52a8\u4f5c\u548c\u81ea\u7531\u5f62\u5f0f\u7684\u8bed\u8a00\u601d\u60f3\uff0c\u7528\u4e8e\u4efb\u52a1\u89e3\u51b3(\u56fe1 
(1d)\uff0c(2b))\u3002\u6bcf\u4e2a\u4e0a\u4e0b\u6587\u4e2d\u7684\u793a\u4f8b\u90fd\u662f\u7528\u4e8e\u89e3\u51b3\u4efb\u52a1\u5b9e\u4f8b\u7684\u4eba\u7c7b\u884c\u52a8\u3001\u601d\u60f3\u548c\u73af\u5883\u89c2\u5bdf\u7684\u8f68\u8ff9(\u53c2\u89c1\u9644\u5f55C)\u3002\u5bf9\u4e8e\u63a8\u7406\u5177\u6709\u9996\u8981\u91cd\u8981\u6027\u7684\u4efb\u52a1(\u56fe1(1))\uff0c\u6211\u4eec\u4ea4\u66ff\u751f\u6210\u601d\u60f3\u548c\u884c\u52a8\uff0c\u4ee5\u4fbf\u4efb\u52a1\u89e3\u51b3\u8f68\u8ff9\u7531\u591a\u4e2a\u601d\u60f3-\u884c\u52a8-\u89c2\u5bdf\u6b65\u9aa4\u7ec4\u6210\u3002\u76f8\u6bd4\u4e4b\u4e0b\uff0c\u5bf9\u4e8e\u53ef\u80fd\u6d89\u53ca\u5927\u91cf\u884c\u52a8\u7684\u51b3\u7b56\u4efb\u52a1(\u56fe1(2))\uff0c\u601d\u60f3\u53ea\u9700\u8981\u7a00\u758f\u5730\u51fa\u73b0\u5728\u8f68\u8ff9\u7684\u6700\u76f8\u5173\u4f4d\u7f6e\uff0c\u56e0\u6b64\u6211\u4eec\u8ba9\u8bed\u8a00\u6a21\u578b\u4e3a\u81ea\u5df1\u51b3\u5b9a\u601d\u60f3\u548c\u884c\u52a8\u7684\u5f02\u6b65\u53d1\u751f\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>\u7531\u4e8e\u51b3\u7b56\u548c\u63a8\u7406\u80fd\u529b\u96c6\u6210\u5230\u4e00\u4e2a\u5927\u578b\u8bed\u8a00\u6a21\u578b\u4e2d\uff0cReAct\u5177\u6709\u4ee5\u4e0b\u51e0\u4e2a\u72ec\u7279\u7684\u7279\u70b9:<\/p>\n<p><strong>A)\u76f4\u89c2\u4e14\u6613\u4e8e\u8bbe\u8ba1\uff1a<\/strong>\u8bbe\u8ba1ReAct\u63d0\u793a\u5f88\u7b80\u5355\uff0c\u56e0\u4e3a\u4eba\u7c7b\u6ce8\u91ca\u8005\u53ea\u9700\u5728\u4ed6\u4eec\u7684\u884c\u52a8\u4e4b\u4e0a\u7528\u8bed\u8a00\u8868\u8fbe\u4ed6\u4eec\u7684\u60f3\u6cd5\u3002\u672c\u6587\u6ca1\u6709\u4f7f\u7528\u7279\u5b9a\u7684\u683c\u5f0f\u9009\u62e9\u3001\u601d\u8003\u8bbe\u8ba1\u6216\u793a\u4f8b\u9009\u62e9\u3002\u6211\u4eec\u5728\u7b2c3\u8282\u548c\u7b2c4\u8282\u8be6\u7ec6\u63cf\u8ff0\u4e86\u6bcf\u9879\u4efb\u52a1\u7684\u63d0\u793a\u8bbe\u8ba1\u3002<\/p>\n<p><strong>B)\u901a\u7528\u4e14\u7075\u6d3b\uff1a<\/strong>\u7531\u4e8e\u7075\u6d3b\u7684\u601d\u8003\u7a7a\u95f4\u548c\u601d\u8003-\u884c\u52a8\u53d1\u751f\u683c\u5f0f\uff0cReAct\u9002\u7528\u4e8e\u5
177\u6709\u4e0d\u540c\u884c\u52a8\u7a7a\u95f4\u548c\u63a8\u7406\u9700\u6c42\u7684\u591a\u6837\u5316\u4efb\u52a1\uff0c\u5305\u62ec\u4f46\u4e0d\u9650\u4e8eQA\u3001\u4e8b\u5b9e\u9a8c\u8bc1\u3001\u6587\u672c\u6e38\u620f\u548c\u7f51\u9875\u5bfc\u822a\u3002<\/p>\n<p><strong>C)\u6027\u80fd\u5f3a\u5927\u4e14\u7a33\u5065\uff1a<\/strong>ReAct\u5728\u5b66\u4e60\u4ec5\u4ece\u4e00\u4e2a\u5230\u516d\u4e2a\u4e0a\u4e0b\u6587\u793a\u4f8b\u65f6\u5c55\u73b0\u51fa\u5f3a\u5927\u7684\u6cdb\u5316\u80fd\u529b\uff0c\u59cb\u7ec8\u5728\u4e0d\u540c\u9886\u57df\u4e2d\u4e00\u81f4\u5730\u8d85\u8d8a\u53ea\u6709\u63a8\u7406\u6216\u884c\u52a8\u7684\u57fa\u7ebf\u3002\u6211\u4eec\u8fd8\u5728\u7b2c3\u8282\u5c55\u793a\u4e86\u542f\u7528\u5fae\u8c03\u65f6\u7684\u989d\u5916\u597d\u5904\uff0c\u5728\u7b2c4\u8282\u5c55\u793a\u4e86ReAct\u6027\u80fd\u5bf9\u63d0\u793a\u9009\u62e9\u7684\u7a33\u5065\u6027\u3002<\/p>\n<p><strong> D)\u4e0e\u4eba\u7c7b\u5bf9\u9f50\u4e14\u53ef\u63a7\uff1a<\/strong>ReAct\u627f\u8bfa\u4e00\u4e2a\u53ef\u89e3\u91ca\u7684\u987a\u5e8f\u51b3\u7b56\u5236\u5b9a\u548c\u63a8\u7406\u8fc7\u7a0b\uff0c\u4eba\u7c7b\u53ef\u4ee5\u8f7b\u677e\u68c0\u67e5\u63a8\u7406\u548c\u4e8b\u5b9e\u6b63\u786e\u6027\u3002\u6b64\u5916\uff0c\u6b63\u5982\u7b2c4\u8282\u4e2d\u7684\u56fe5\u6240\u793a\uff0c\u4eba\u7c7b\u8fd8\u53ef\u4ee5\u901a\u8fc7\u601d\u8003\u7f16\u8f91\u6765\u63a7\u5236\u6216\u7ea0\u6b63\u667a\u80fd\u4f53\u884c\u4e3a\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>&nbsp;<\/p>\n<h2>3 \u77e5\u8bc6\u5bc6\u96c6\u578b\u63a8\u7406\u4efb\u52a1<\/h2>\n<p>&nbsp;<\/p>\n<p>\u4ece\u77e5\u8bc6\u5bc6\u96c6\u578b\u63a8\u7406\u4efb\u52a1\u5f00\u59cb\uff0c\u5982\u591a\u8df3\u95ee\u7b54\u548c\u4e8b\u5b9e\u9a8c\u8bc1\u3002\u5982\u56fe1 
(1d)\u6240\u793a\uff0c\u901a\u8fc7\u4e0e\u7ef4\u57fa\u767e\u79d1API\u4ea4\u4e92\uff0cReAct\u80fd\u591f\u68c0\u7d22\u4fe1\u606f\u4ee5\u652f\u6301\u63a8\u7406\uff0c\u540c\u65f6\u4e5f\u4f7f\u7528\u63a8\u7406\u6765\u786e\u5b9a\u4e0b\u4e00\u6b65\u8981\u68c0\u7d22\u7684\u5185\u5bb9\uff0c\u5c55\u793a\u4e86\u63a8\u7406\u548c\u884c\u52a8\u7684\u534f\u540c\u4f5c\u7528\u3002<\/p>\n<p>&nbsp;<\/p>\n<h3>3.1 \u8bbe\u7f6e<\/h3>\n<p><strong>\u9886\u57df\uff08Domains\uff09<\/strong> \u6211\u4eec\u8003\u8651\u4e24\u4e2a\u6570\u636e\u96c6\uff0c\u5b83\u4eec\u5bf9\u77e5\u8bc6\u68c0\u7d22\u548c\u63a8\u7406\u63d0\u51fa\u4e86\u6311\u6218\uff1a(1) HotPotQA \uff0c\u8fd9\u662f\u4e00\u4e2a\u9700\u8981\u5728\u4e24\u7bc7\u6216\u66f4\u591a\u7ef4\u57fa\u767e\u79d1\u6587\u7ae0\u4e0a\u8fdb\u884c\u63a8\u7406\u7684\u591a\u8df3\u95ee\u9898\u56de\u7b54\u57fa\u51c6\uff1b(2) FEVER\uff0c\u8fd9\u662f\u4e00\u4e2a\u4e8b\u5b9e\u9a8c\u8bc1\u57fa\u51c6\uff0c\u6bcf\u4e2a\u58f0\u660e\u90fd\u88ab\u6807\u6ce8\u4e3aSUPPORTS\uff08\u652f\u6301\uff09\u3001REFUTES\uff08\u53cd\u9a73\uff09\u6216NOT ENOUGH INFO\uff08\u4fe1\u606f\u4e0d\u8db3\uff09\uff0c\u8fd9\u53d6\u51b3\u4e8e\u662f\u5426\u5b58\u5728\u7ef4\u57fa\u767e\u79d1\u6587\u7ae0\u6765\u9a8c\u8bc1\u8be5\u58f0\u660e\u3002\u5728\u8fd9\u9879\u5de5\u4f5c\u4e2d\uff0c\u6211\u4eec\u5728\u4e24\u4e2a\u4efb\u52a1\u4e2d\u90fd\u91c7\u7528\u4ec5\u95ee\u9898\u7684\u8bbe\u7f6e\uff0c\u6a21\u578b\u53ea\u63a5\u6536\u95ee\u9898\/\u58f0\u660e\u4f5c\u4e3a\u8f93\u5165\uff0c\u800c\u65e0\u6cd5\u8bbf\u95ee\u652f\u6301\u6bb5\u843d\uff0c\u5e76\u4e14\u5fc5\u987b\u4f9d\u8d56\u5b83\u4eec\u7684\u5185\u90e8\u77e5\u8bc6\u6216\u901a\u8fc7\u4e0e\u5916\u90e8\u73af\u5883\u4ea4\u4e92\u6765\u68c0\u7d22\u77e5\u8bc6\u4ee5\u652f\u6301\u63a8\u7406\u3002<\/p>\n<p><strong>\u884c\u52a8\u7a7a\u95f4\uff08Action Space\uff09<\/strong>\u00a0\u6211\u4eec\u8bbe\u8ba1\u4e86\u4e00\u4e2a\u7b80\u5355\u7684\u7ef4\u57fa\u767e\u79d1Web 
API\uff0c\u5305\u542b\u4e09\u79cd\u7c7b\u578b\u7684\u64cd\u4f5c\u6765\u652f\u6301\u4ea4\u4e92\u5f0f\u4fe1\u606f\u68c0\u7d22\uff1a<\/p>\n<p>(1) <strong>\u641c\u7d22<\/strong> [\u5b9e\u4f53]\uff0c\u5982\u679c\u5b58\u5728\uff0c\u5219\u4ece\u5bf9\u5e94\u7684\u5b9e\u4f53 wiki\u9875\u9762\u8fd4\u56de\u524d5\u4e2a\u53e5\u5b50\uff0c\u5426\u5219\u4ece\u7ef4\u57fa\u767e\u79d1\u641c\u7d22\u5f15\u64ce\u5efa\u8bae\u524d5\u4e2a\u76f8\u4f3c\u7684\u5b9e\u4f53\uff0c<\/p>\n<p>(2) <strong>\u67e5\u627e<\/strong> [\u5b57\u7b26\u4e32]\uff0c\u5b83\u5c06\u8fd4\u56de\u5305\u542b\u5b57\u7b26\u4e32\u7684\u9875\u9762\u4e2d\u7684\u4e0b\u4e00\u53e5\u8bdd\uff0c\u6a21\u62df\u6d4f\u89c8\u5668\u4e0a\u7684Ctrl+F\u529f\u80fd\u3002<\/p>\n<p>(3) <strong>\u5b8c\u6210<\/strong> [\u7b54\u6848]\uff0c\u7528\u7b54\u6848\u5b8c\u6210\u5f53\u524d\u4efb\u52a1\u3002\u8be5\u52a8\u4f5c\u7a7a\u95f4\u5927\u591a\u53ea\u80fd\u6839\u636e\u51c6\u786e\u7684\u6bb5\u843d\u540d\u79f0\u68c0\u7d22\u6bb5\u843d\u7684\u4e00\u5c0f\u90e8\u5206\uff0c\u6bd4\u6700\u5148\u8fdb\u7684\u8bcd\u6c47\u6216\u795e\u7ecf\u68c0\u7d22\u5668\u5f31\u5f97\u591a\u3002\u5176\u76ee\u7684\u662f\u6a21\u62df\u4eba\u7c7b\u5982\u4f55\u4e0e\u7ef4\u57fa\u767e\u79d1\u4e92\u52a8\uff0c\u5e76\u8feb\u4f7f\u6a21\u578b\u901a\u8fc7\u8bed\u8a00\u7684\u663e\u5f0f\u63a8\u7406\u8fdb\u884c\u68c0\u7d22\u3002<\/p>\n<p>&nbsp;<\/p>\n<h3>3.2 \u65b9\u6cd5<\/h3>\n<p><strong>ReAct Prompting<\/strong> \u5e94\u7528\u4e8eHotpotQA\u548cFever\uff0c\u6211\u4eec\u4ece\u8bad\u7ec3\u96c6\u4e2d\u968f\u673a\u9009\u62e9\u4e866\u4e2a\u548c3\u4e2a\u6848\u4f8b\uff0c\u5e76\u624b\u52a8\u7f16\u5199ReAct\u683c\u5f0f\u7684\u8f68\u8ff9\uff0c\u4ee5\u7528\u4f5c\u63d0\u793a\u4e2d\u7684\u5c11\u6837\u672c\u793a\u4f8b\u3002\u7c7b\u4f3c\u4e8e\u56fe1 (d)\uff0c\u6bcf\u4e2a\u8f68\u8ff9\u7531\u591a\u4e2a\u601d\u60f3-\u884c\u52a8-\u89c2\u5bdf\uff08thought-action-observation\uff09\u6b65\u9aa4\u7ec4\u6210(\u5373 
\u5bc6\u96c6\u601d\u7ef4)\uff0c\u5176\u4e2d\u81ea\u7531\u5f62\u5f0f\u7684\u601d\u60f3\u7528\u4e8e\u5404\u79cd\u76ee\u7684\u3002\u5177\u4f53\u6765\u8bf4\uff0c\u6211\u4eec\u4f7f\u7528\u601d\u60f3\u7684\u7ec4\u5408\u6765\u5206\u89e3\u95ee\u9898(\u201c\u6211\u9700\u8981\u641c\u7d22x\uff0c\u627e\u5230y\uff0c\u7136\u540e\u627e\u5230z\u201d)\uff0c\u4ece\u7ef4\u57fa\u767e\u79d1\u89c2\u5bdf\u4e2d\u63d0\u53d6\u4fe1\u606f(\u201cx\u59cb\u4e8e1844\u5e74\u201d\uff0c\u201c\u8be5\u6bb5\u843d\u6ca1\u6709\u544a\u8bc9x\u201d)\uff0c\u6267\u884c\u5e38\u8bc6(\u201cx\u4e0d\u662fy\uff0c\u6240\u4ee5z\u5fc5\u987b\u662f&#8230;&#8230;\u201d)\u6216\u7b97\u672f\u63a8\u7406(\u201c1844 &lt; 1989\u201d)\uff0c\u6307\u5bfc\u641c\u7d22\u91cd\u6784(\u201c\u201c\u4e5f\u8bb8\u6211\u53ef\u4ee5\u641c\u7d22\/\u67e5\u627ex\u201d)\uff0c\u5e76\u5408\u6210\u6700\u7ec8\u7b54\u6848(\u201c\u201c&#8230;&#8230;\u6240\u4ee5\u7b54\u6848\u662fx\u201d)\u3002\u66f4\u591a\u7ec6\u8282\u8bf7\u53c2\u89c1\u9644\u5f55C\u3002<\/p>\n<p>&nbsp;<\/p>\n<p><strong>Baselines<\/strong> \u6211\u4eec\u7cfb\u7edf\u5730\u5220\u9664ReAct\u8f68\u8ff9\u4ee5\u6784\u5efa\u591a\u4e2a\u57fa\u7ebf\u7684\u63d0\u793a(\u683c\u5f0f\u5982\u56fe1 (1a-1c)):<\/p>\n<p>(a)<strong>\u6807\u51c6\u63d0\u793a\/Standard prompting<\/strong>(Standard)\uff0c\u5220\u9664ReAct\u8f68\u8ff9\u4e2d\u7684\u6240\u6709\u60f3\u6cd5\u3001\u884c\u52a8\u3001\u89c2\u5bdf\u3002<\/p>\n<p>(b)<strong>\u601d\u7ef4\u94fe\u63d0\u793a\/Chain-of-thought prompting<\/strong>(CoT) \uff0c\u5b83\u5220\u9664\u4e86\u884c\u52a8\u548c\u89c2\u5bdf\uff0c\u53ea\u4f5c\u4e3a\u63a8\u7406\u7684\u57fa\u7ebf\u3002\u901a\u8fc7\u5728\u63a8\u7406\u8fc7\u7a0b\u4e2d\u91c7\u683721 CoT\u89e3\u7801\u6e29\u5ea6\u4e3a0.7\u7684\u8f68\u8ff9\uff0c\u5e76\u91c7\u7528\u591a\u6570\u7b54\u6848\uff0c\u5efa\u7acb\u4e86\u4e00\u4e2a\u81ea\u4e00\u81f4\u7684\u57fa\u7ebf(CoT-SC) \uff0c\u53d1\u73b0\u8fd9\u59cb\u7ec8\u6bd4CoT\u63d0\u9ad8\u6027\u80fd\u3002<\/p>\n<p>(c)<strong>\u4ec5\u884c\u52a8\u63d0\u793a\/Acting-only 
prompt<\/strong>(Act)\uff0c\u5b83\u5220\u9664\u4e86ReAct\u8f68\u8ff9\u4e2d\u7684\u60f3\u6cd5\uff0c\u5927\u81f4\u7c7b\u4f3c\u4e8eWebGPT\u5982\u4f55\u4e0e\u4e92\u8054\u7f51\u4ea4\u4e92\u4ee5\u56de\u7b54\u95ee\u9898\uff0c\u5c3d\u7ba1\u5b83\u5728\u4e0d\u540c\u7684\u4efb\u52a1\u548c\u884c\u52a8\u7a7a\u95f4\u4e0a\u64cd\u4f5c\uff0c\u5e76\u4f7f\u7528\u6a21\u4eff\u548c\u5f3a\u5316\u5b66\u4e60\u800c\u4e0d\u662f\u63d0\u793a\u3002<\/p>\n<p>&nbsp;<\/p>\n<p><strong>\u7ed3\u5408\u5185\u90e8\u4e0e\u5916\u90e8\u77e5\u8bc6\/Combining Internal and External Knowledge<\/strong> \u6211\u4eec\u5c06\u57283.3\u8282\u4e2d\u8be6\u7ec6\u4ecb\u7ecd\uff0c\u6211\u4eec\u89c2\u5bdf\u5230<span style=\"color: #ff6600;\">ReAct\u6f14\u793a\u7684\u95ee\u9898\u89e3\u51b3\u8fc7\u7a0b\u66f4\u7b26\u5408\u4e8b\u5b9e\u548c\u6839\u636e\uff0c\u800cCoT\u5728\u5236\u5b9a\u63a8\u7406\u7ed3\u6784\u65b9\u9762\u66f4\u51c6\u786e\uff0c\u4f46\u5f88\u5bb9\u6613\u4ea7\u751f\u5e7b\u89c9\u3002<\/span>\u56e0\u6b64\uff0c\u6211\u4eec\u5efa\u8bae\u5408\u5e76ReAct\u548cCoT-SC\uff0c\u5e76\u8ba9\u6a21\u578b\u6839\u636e\u4ee5\u4e0b\u542f\u53d1\u5f0f\u65b9\u6cd5\u51b3\u5b9a\u4f55\u65f6\u5207\u6362\u5230\u5176\u4ed6\u65b9\u6cd5:<\/p>\n<p>a) <strong>ReAct<\/strong>\u2192<strong>CoT-SC<\/strong>:\u5f53ReAct\u5728\u7ed9\u5b9a\u7684\u6b65\u9aa4\u5185\u65e0\u6cd5\u8fd4\u56de\u7b54\u6848\u65f6\uff0c\u9000\u56de\u5230CoT-SC\u3002\u6211\u4eec\u4e3aHotpotQA\u548cFEVER\u5206\u522b\u8bbe\u7f6e\u4e867\u548c5\u4e2a\u6b65\u9aa4\uff0c\u56e0\u4e3a\u6211\u4eec\u53d1\u73b0\u66f4\u591a\u6b65\u9aa4\u4e0d\u4f1a\u63d0\u9ad8ReAct\u6027\u80fd\u3002<\/p>\n<p>b) 
<strong>CoT-SC<\/strong>\u2192<strong>ReAct<\/strong>:\u5f53<em>n<\/em>CoT-SC\u6837\u672c\u4e2d\u7684\u5927\u591a\u6570\u7b54\u6848\u51fa\u73b0\u7684\u6b21\u6570\u5c11\u4e8e<em>n\/<\/em>2\u6b21\u65f6(\u5373\uff1a\u5185\u90e8\u77e5\u8bc6\u53ef\u80fd\u65e0\u6cd5\u81ea\u4fe1\u5730\u652f\u6301\u4efb\u52a1)\uff0c\u8bf7\u9000\u56de\u5230ReAct\u3002<\/p>\n<p>&nbsp;<\/p>\n<p><strong>\u5fae\u8c03\/Finetuning<\/strong> \u7531\u4e8e\u5927\u89c4\u6a21\u624b\u52a8\u6807\u6ce8\u63a8\u7406\u8f68\u8ff9\u548c\u52a8\u4f5c\u7684\u6311\u6218\uff0c\u672c\u6587\u8003\u8651\u4e00\u79cd\u7c7b\u4f3c\u4e8eZelikman et al. (2022)\u7684\u81ea\u52a9\u65b9\u6cd5\uff0c\u4f7f\u7528ReAct(\u4e5f\u7528\u4e8e\u5176\u4ed6\u57fa\u7ebf)\u751f\u6210\u76843000\u4e2a\u5177\u6709\u6b63\u786e\u7b54\u6848\u7684\u8f68\u8ff9\u6765\u5fae\u8c03\u8f83\u5c0f\u7684\u8bed\u8a00\u6a21\u578b(PaLM-8\/62B)\uff0c\u4ee5\u89e3\u7801\u4ee5\u8f93\u5165\u95ee\u9898\/\u58f0\u660e\u4e3a\u6761\u4ef6\u7684\u8f68\u8ff9(\u6240\u6709\u60f3\u6cd5\u3001\u884c\u52a8\u3001\u89c2\u5bdf)\u3002\u66f4\u591a\u7ec6\u8282\u89c1\u9644\u5f55B.1\u3002<\/p>\n<p>&nbsp;<\/p>\n<h3>3.3 \u7ed3\u679c\u4e0e\u89c2\u5bdf<\/h3>\n<p><strong>ReAct\u6574\u4f53\u8d85\u8d8aAct\/ReAct outperforms Act consistently<\/strong> \u88681\u663e\u793a\u4e86\u4f7f\u7528PaLM-540B\u4f5c\u4e3a\u57fa\u7840\u6a21\u578b\u5e76\u4f7f\u7528\u4e0d\u540c\u63d0\u793a\u65b9\u6cd5\u7684HotpotQA\u548cFever\u7ed3\u679c\u3002\u6211\u4eec\u6ce8\u610f\u5230ReAct\u5728\u4e24\u4e2a\u4efb\u52a1\u4e0a\u90fd\u4f18\u4e8eAct\uff0c\u8bc1\u660e\u4e86\u63a8\u7406\u6307\u5bfc\u884c\u52a8\u7684\u4ef7\u503c\uff0c\u7279\u522b\u662f\u5728\u5408\u6210\u6700\u7ec8\u7b54\u6848\u65b9\u9762\uff0c\u5982\u56fe1 (1c-d)\u6240\u793a\u3002\u5fae\u8c03\u7ed3\u679c3\u4e5f\u8bc1\u5b9e\u4e86\u63a8\u7406\u75d5\u8ff9\u5bf9\u66f4\u660e\u667a\u7684\u884c\u52a8\u7684\u597d\u5904\u3002<\/p>\n<p>&nbsp;<\/p>\n<div style=\"width: 670px\" class=\"wp-caption aligncenter\"><img loading=\"lazy\" decoding=\"async\" class=\"aligncenter 
size-full wp-image-2597\" title=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-2\" src=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/7f5ae66ca45845a.png\" alt=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-2\" width=\"660\" height=\"450\" srcset=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/7f5ae66ca45845a.png 660w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/7f5ae66ca45845a-300x205.png 300w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/7f5ae66ca45845a-220x150.png 220w\" sizes=\"auto, (max-width: 660px) 100vw, 660px\" \/><p class=\"wp-caption-text\">\u88681\uff1aPaLM-540B\u5728HotpotQA\u548cFever\u4e0a\u7684\u63d0\u793a\u7ed3\u679c\u3002<\/p><\/div>\n<p>&nbsp;<\/p>\n<p><strong>ReAct <\/strong>vs. <strong>CoT <\/strong>\u53e6\u4e00\u65b9\u9762\uff0cReAct\u5728Fever\u4e0a\u4f18\u4e8eCoT(60.9\u6bd4 56.3)\uff0c\u5728HotpotQA\u4e0a\u7565\u843d\u540e\u4e8eCoT(27.4\u6bd4 29.4)\u3002Fever\u4e2d\u652f\u6301\/\u53cd\u9a73\uff08SUPPORTS\/REFUTES\uff09\u7684\u58f0\u660e\u4e4b\u95f4\u53ef\u80fd\u53ea\u6709\u5fae\u5c0f\u7684\u5dee\u522b(\u53c2\u89c1\u9644\u5f55D.1)\uff0c\u56e0\u6b64\u91c7\u53d6\u884c\u52a8\u83b7\u53d6\u51c6\u786e\u548c\u6700\u65b0\u7684\u77e5\u8bc6\u81f3\u5173\u91cd\u8981\u3002\u4e3a\u4e86\u66f4\u597d\u5730\u7406\u89e3HotpotQA\u4e0aReAct\u548cCoT\u4e4b\u95f4\u7684\u884c\u4e3a\u5dee\u5f02\uff0c\u6211\u4eec\u5206\u522b\u4eceReAct\u548cCoT(\u5171200\u4e2a\u793a\u4f8b)\u4e2d\u968f\u673a\u62bd\u683750\u4e2a\u7b54\u6848\u6b63\u786e\u548c\u9519\u8bef\u7684\u8f68\u8ff9(EM\u5224\u65ad)\uff0c\u5e76\u5728\u88682\u4e2d\u624b\u52a8\u6807\u8bb0\u5b83\u4eec\u7684\u6210\u529f\u548c\u5931\u8d25\u6a21\u5f0f\u3002\u4ee5\u4e0b\u662f\u4e00\u4e9b\u5173\u952e\u7684\u89c2\u5bdf\u7ed3\u679c\u3002<\/p>\n<p>&nbsp;<\/p>\n<div style=\"width: 1439px\" class=\"wp-caption aligncenter\"><img loading=\"lazy\" decoding=\"async\" class=\"aligncenter size-full 
wp-image-2530\" title=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-3\" src=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/cabb96aa55301dd.png\" alt=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-3\" width=\"1429\" height=\"269\" srcset=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/cabb96aa55301dd.png 1429w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/cabb96aa55301dd-300x56.png 300w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/cabb96aa55301dd-1024x193.png 1024w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/cabb96aa55301dd-768x145.png 768w\" sizes=\"auto, (max-width: 1429px) 100vw, 1429px\" \/><p class=\"wp-caption-text\">\u8868 2\uff1aReAct \u548c CoT \u5728 HotpotQA \u4e0a\u7684\u6210\u529f\u548c\u5931\u8d25\u6a21\u5f0f\u7c7b\u578b\uff0c\u4ee5\u53ca\u5b83\u4eec\u5728\u4eba\u7c7b\u7814\u7a76\u7684\u968f\u673a\u9009\u62e9\u7684\u4f8b\u5b50\u4e2d\u7684\u767e\u5206\u6bd4\u3002<\/p><\/div>\n<p>&nbsp;<\/p>\n<p><strong>A) \u5e7b\u89c9\u5bf9\u4e8eCoT\u6765\u8bf4\u662f\u4e00\u4e2a\u4e25\u91cd\u7684\u95ee\u9898<\/strong>\uff0c\u5728\u6210\u529f\u6a21\u5f0f\u4e0b\u5bfc\u81f4\u5176\u8bef\u62a5\u7387\u8fdc\u9ad8\u4e8eReAct\uff0814%\u5bf9\u6bd46%\uff09\uff0c\u5e76\u4e14\u6784\u6210\u4e86\u5176\u4e3b\u8981\u7684\u5931\u8d25\u6a21\u5f0f\uff0856%\uff09\u3002\u76f8\u6bd4\u4e4b\u4e0b\uff0c\u7531\u4e8e\u80fd\u591f\u63a5\u5165\u5916\u90e8\u77e5\u8bc6\u5e93\uff0cReAct\u7684\u95ee\u9898\u89e3\u51b3\u8f68\u8ff9\u66f4\u52a0\u8d34\u8fd1\u5b9e\u9645\u3001\u4ee5\u4e8b\u5b9e\u4e3a\u9a71\u52a8\uff0c\u5e76\u4e14\u66f4\u52a0\u53ef\u4fe1\u3002<\/p>\n<p><strong>B) 
\u867d\u7136\u4ea4\u9519\u63a8\u7406\u3001\u884c\u52a8\u548c\u89c2\u5bdf\u6b65\u9aa4\u63d0\u9ad8\u4e86ReAct\u7684\u5b9e\u9645\u6027\u548c\u53ef\u4fe1\u5ea6\uff0c\u4f46\u8fd9\u79cd\u7ed3\u6784\u6027\u7ea6\u675f\u4e5f\u964d\u4f4e\u4e86\u5b83\u5728\u5236\u5b9a\u63a8\u7406\u6b65\u9aa4\u65f6\u7684\u7075\u6d3b\u6027<\/strong>\uff0c\u5bfc\u81f4\u5176\u63a8\u7406\u9519\u8bef\u7387\u9ad8\u4e8eCoT\u3002\u6211\u4eec\u6ce8\u610f\u5230ReAct\u6709\u4e00\u4e2a\u7279\u5b9a\u7684\u9891\u7e41\u9519\u8bef\u6a21\u5f0f\uff0c\u5373\u6a21\u578b\u91cd\u590d\u751f\u6210\u4e4b\u524d\u7684\u60f3\u6cd5\u548c\u884c\u52a8\uff0c\u6211\u4eec\u5c06\u5176\u5f52\u7c7b\u4e3a\u201c\u63a8\u7406\u9519\u8bef\u201d\u7684\u4e00\u90e8\u5206\uff0c\u56e0\u4e3a\u6a21\u578b\u672a\u80fd\u63a8\u7406\u51fa\u9002\u5f53\u7684\u4e0b\u4e00\u4e2a\u884c\u52a8\u5e76\u8df3\u51fa\u5faa\u73af\u3002<\/p>\n<p><strong>C) \u5bf9\u4e8eReAct\u6765\u8bf4\uff0c\u901a\u8fc7\u641c\u7d22\u6210\u529f\u68c0\u7d22\u5230\u4fe1\u606f\u6027\u77e5\u8bc6\u81f3\u5173\u91cd\u8981\u3002<\/strong>\u975e\u4fe1\u606f\u6027\u641c\u7d22\u5360\u9519\u8bef\u6848\u4f8b\u768423%\uff0c\u4f7f\u6a21\u578b\u63a8\u7406\u8131\u8f68\uff0c\u5e76\u4f7f\u5176\u96be\u4ee5\u6062\u590d\u548c\u91cd\u65b0\u6784\u601d\u60f3\u6cd5\u3002\u8fd9\u53ef\u80fd\u662f\u4e8b\u5b9e\u6027\u548c\u7075\u6d3b\u6027\u4e4b\u95f4\u9884\u671f\u7684\u6743\u8861\uff0c\u8fd9\u4e5f\u6fc0\u53d1\u4e86\u6211\u4eec\u63d0\u51fa\u7ed3\u5408\u4e24\u79cd\u65b9\u6cd5\u7684\u7b56\u7565\u3002<\/p>\n<p>\u6211\u4eec\u5728\u9644\u5f55E.1\u4e2d\u4e3a\u6bcf\u79cd\u6210\u529f\u548c\u5931\u8d25\u6a21\u5f0f\u63d0\u4f9b\u4e86\u793a\u4f8b\u3002\u6211\u4eec\u8fd8\u53d1\u73b0\u4e00\u4e9bHotpotQA\u95ee\u9898\u53ef\u80fd\u5305\u542b\u8fc7\u65f6\u7684\u7b54\u6848\u6807\u7b7e\uff0c\u89c1\u56fe4\u793a\u4f8b\u3002<\/p>\n<p>&nbsp;<\/p>\n<p><strong>ReAct + 
CoT-SC\u5728\u63d0\u793aLLMs\u65b9\u9762\u8868\u73b0\u6700\u597d\u3002<\/strong>\u5982\u88681\u6240\u793a\uff0cHotpotQA\u548cFever\u4e0a\u6700\u597d\u7684\u63d0\u793a\u65b9\u6cd5\u5206\u522b\u662fReAct \u2192 CoT-SC\u548cCoT-SC \u2192 ReAct\u3002\u6b64\u5916\uff0c\u56fe2\u5c55\u793a\u4e86\u4e0d\u540c\u65b9\u6cd5\u5728\u4f7f\u7528\u4e0d\u540c\u6570\u91cfCoT-SC\u6837\u672c\u65f6\u7684\u8868\u73b0\u3002\u867d\u7136\u4e24\u79cdReAct + CoT-SC\u65b9\u6cd5\u5728\u5404\u81ea\u7684\u4efb\u52a1\u4e2d\u6709\u4f18\u52bf\uff0c\u4f46\u4ed6\u4eec\u90fd\u663e\u8457\u4e14\u4e00\u81f4\u5730\u4f18\u4e8eCoT-SC\uff0c\u5728\u4e0d\u540c\u6570\u91cf\u7684\u6837\u672c\u4e2d\uff0c\u53ea\u4f7f\u75283-5\u4e2a\u6837\u672c\u5c31\u80fd\u8fbe\u5230CoT-SC\u7684\u8868\u73b0\uff0c\u8fd9\u4e2a\u7ed3\u679c\u8868\u660e\u4e86\u9002\u5f53\u7ed3\u5408\u6a21\u578b\u5185\u90e8\u77e5\u8bc6\u548c\u5916\u90e8\u77e5\u8bc6\u5bf9\u4e8e\u63a8\u7406\u4efb\u52a1\u7684\u4ef7\u503c\u3002<\/p>\n<p>&nbsp;<\/p>\n<div style=\"width: 1219px\" class=\"wp-caption aligncenter\"><img loading=\"lazy\" decoding=\"async\" class=\"aligncenter size-full wp-image-2599\" title=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-4\" src=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/c4aae4d455245f1.png\" alt=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-4\" width=\"1209\" height=\"574\" srcset=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/c4aae4d455245f1.png 1209w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/c4aae4d455245f1-300x142.png 300w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/c4aae4d455245f1-1024x486.png 1024w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/c4aae4d455245f1-768x365.png 768w\" sizes=\"auto, (max-width: 1209px) 100vw, 1209px\" \/><p class=\"wp-caption-text\">\u56fe 
2\uff1a\u6839\u636e\u4f7f\u7528\u7684CoT-SC\u6837\u672c\u6570\u91cf\u5c55\u793a\u7684PaLM-540B\u63d0\u793a\u7ed3\u679c\u3002<\/p><\/div>\n<p>&nbsp;<\/p>\n<p><strong>ReAct\u5728\u5fae\u8c03\u65b9\u9762\u8868\u73b0\u6700\u4f18\u3002<\/strong>\u56fe3\u663e\u793a\u4e86\u56db\u79cd\u65b9\u6cd5\uff08Standard, CoT, Act, ReAct\uff09\u5728HotpotQA\u4e0a\u7684\u63d0\u793a\/\u5fae\u8c03\u7684\u6269\u5c55\u6548\u5e94\u3002\u5728PaLM-8\/62B\u4e2d\uff0c\u7531\u4e8e\u4ece\u60c5\u666f\u4e2d\u5b66\u4e60\u63a8\u7406\u548c\u884c\u52a8\u7684\u96be\u5ea6\uff0c\u63d0\u793aReAct\u7684\u8868\u73b0\u662f\u56db\u79cd\u65b9\u6cd5\u4e2d\u6700\u5dee\u7684\u3002\u7136\u800c\uff0c\u5f53\u4ec5\u75283,000\u4e2a\u4f8b\u5b50\u5fae\u8c03\u65f6\uff0cReAct\u6210\u4e3a\u56db\u79cd\u65b9\u6cd5\u4e2d\u6700\u597d\u7684\uff0c\u5176\u4e2dPaLM-8B\u5fae\u8c03ReAct\u7684\u8868\u73b0\u4f18\u4e8e\u6240\u6709PaLM-62B\u7684\u63d0\u793a\u65b9\u6cd5\uff0c\u800cPaLM-62B\u5fae\u8c03ReAct\u7684\u8868\u73b0\u4f18\u4e8e\u6240\u6709540B\u7684\u63d0\u793a\u65b9\u6cd5\u3002\u76f8\u6bd4\u4e4b\u4e0b\uff0c\u5fae\u8c03Standard\u6216CoT\u7684\u8868\u73b0\u663e\u8457\u5730\u5dee\u4e8e\u5fae\u8c03ReAct\u6216Act\uff0c\u5728PaLM8\/62B\u4e2d\uff0c\u524d\u8005\u4e3b\u8981\u6559\u6a21\u578b\u8bb0\u5fc6\uff08\u53ef\u80fd\u662f\u865a\u6784\u7684\uff09\u77e5\u8bc6\u4e8b\u5b9e\uff0c\u540e\u8005\u6559\u6a21\u578b\u5982\u4f55\uff08\u63a8\u7406\u548c\uff09\u884c\u52a8\u4ece\u7ef4\u57fa\u767e\u79d1\u83b7\u53d6\u4fe1\u606f\uff0c\u8fd9\u662f\u4e00\u9879\u66f4\u5177\u666e\u904d\u6027\u7684\u77e5\u8bc6\u63a8\u7406\u6280\u80fd\u3002\u7531\u4e8e\u6240\u6709\u7684\u63d0\u793a\u65b9\u6cd5\u90fd\u8fd8\u663e\u8457\u5730\u4f4e\u4e8e\u9886\u57df\u7279\u5b9a\u7684\u6700\u5148\u8fdb\u65b9\u6cd5\uff08\u88681\uff09\uff0c\u6211\u4eec\u76f8\u4fe1\uff0c\u4f7f\u7528\u66f4\u591a\u4eba\u7c7b\u5199\u7684\u6570\u636e\u8fdb\u884c\u5fae\u8c03\u53ef\u80fd\u662f\u91ca\u653eReAct\u80fd\u529b\u7684\u66f4\u597d\u65b9\u5f0f\u3002<\/p>\n<p>&nbsp;<\/p>\n<div style=\"width: 
1021px\" class=\"wp-caption aligncenter\"><img loading=\"lazy\" decoding=\"async\" class=\"aligncenter size-full wp-image-2531\" title=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-5\" src=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/d75e8c67887a6cc.png\" alt=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-5\" width=\"1011\" height=\"401\" srcset=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/d75e8c67887a6cc.png 1011w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/d75e8c67887a6cc-300x119.png 300w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/d75e8c67887a6cc-768x305.png 768w\" sizes=\"auto, (max-width: 1011px) 100vw, 1011px\" \/><p class=\"wp-caption-text\">\u56fe3\uff1a\u4f7f\u7528ReAct\uff08\u6211\u4eec\u7684\u65b9\u6cd5\uff09\u548c\u57fa\u7ebf\u5bf9HotPotQA\u8fdb\u884c\u63d0\u793a\u548c\u5fae\u8c03\u7684\u6269\u5c55\u7ed3\u679c\u3002<\/p><\/div>\n<p>&nbsp;<\/p>\n<p>&nbsp;<\/p>\n<h2>4 \u51b3\u7b56\u4efb\u52a1<\/h2>\n<p>&nbsp;<\/p>\n<p>\u6211\u4eec\u8fd8\u5bf9ReAct\u5728\u4e24\u4e2a\u57fa\u4e8e\u8bed\u8a00\u7684\u4ea4\u4e92\u5f0f\u51b3\u7b56\u4efb\u52a1\u4e0a\u8fdb\u884c\u4e86\u6d4b\u8bd5\uff0c\u5373ALFWorld\u548cWebShop\uff0c\u8fd9\u4e24\u4e2a\u4efb\u52a1\u90fd\u5177\u6709\u590d\u6742\u7684\u73af\u5883\uff0c\u9700\u8981\u667a\u80fd\u4f53\u5728\u957f\u65f6\u95f4\u8de8\u5ea6\u5185\u91c7\u53d6\u884c\u52a8\uff0c\u4e14\u5956\u52b1\u7a00\u758f\uff0c\u8fd9\u5c31\u9700\u8981\u667a\u80fd\u4f53\u8fdb\u884c\u6709\u6548\u63a8\u7406\u4ee5\u91c7\u53d6\u884c\u52a8\u548c\u63a2\u7d22\u3002<\/p>\n<p><strong>ALFWorld<\/strong> 
ALFWorld\uff08\u56fe1(2)\uff09\u662f\u4e00\u4e2a\u5408\u6210\u7684\u57fa\u4e8e\u6587\u672c\u7684\u6e38\u620f\uff0c\u65e8\u5728\u4e0e\u4f53\u73b0\u6027\u7684ALFRED\u57fa\u51c6\u4fdd\u6301\u4e00\u81f4\u3002\u5b83\u5305\u62ec6\u79cd\u7c7b\u578b\u7684\u4efb\u52a1\uff0c\u5176\u4e2d\u667a\u80fd\u4f53\u9700\u8981\u901a\u8fc7\u6587\u672c\u884c\u52a8\uff08\u4f8b\u5982\uff0c\u524d\u5f80\u5496\u5561\u684c1\uff0c\u62ff\u8d77\u6587\u4ef62\uff0c\u4f7f\u7528\u53f0\u706f1\uff09\u5bfc\u822a\u548c\u4e0e\u6a21\u62df\u5bb6\u5ead\u4e92\u52a8\u6765\u5b9e\u73b0\u9ad8\u7ea7\u76ee\u6807\uff08\u4f8b\u5982\uff0c\u5728\u53f0\u706f\u4e0b\u68c0\u67e5\u6587\u4ef6\uff09\u3002\u4e00\u4e2a\u4efb\u52a1\u5b9e\u4f8b\u53ef\u4ee5\u6709\u8d85\u8fc750\u4e2a\u4f4d\u7f6e\uff0c\u5e76\u4e14\u9700\u8981\u4e13\u5bb6\u7b56\u7565\u8d85\u8fc750\u6b65\u624d\u80fd\u89e3\u51b3\uff0c\u8fd9\u5bf9\u667a\u80fd\u4f53\u63d0\u51fa\u4e86\u6311\u6218\uff0c\u8981\u6c42\u5176\u89c4\u5212\u548c\u8ddf\u8e2a\u5b50\u76ee\u6807\uff0c\u4ee5\u53ca\u7cfb\u7edf\u5730\u63a2\u7d22\uff08\u4f8b\u5982\uff0c\u9010\u4e2a\u68c0\u67e5\u6240\u6709\u684c\u5b50\u5bfb\u627e\u53f0\u706f\uff09\u3002\u7279\u522b\u662f\uff0cALFWorld\u5185\u7f6e\u7684\u4e00\u4e2a\u6311\u6218\u662f\u9700\u8981\u786e\u5b9a\u5e38\u89c1\u5bb6\u7528\u7269\u54c1\u7684\u53ef\u80fd\u4f4d\u7f6e\uff08\u4f8b\u5982\uff0c\u53f0\u706f\u5f88\u53ef\u80fd\u5728\u684c\u5b50\u4e0a\u3001\u67b6\u5b50\u4e0a\u6216\u68b3\u5986\u53f0\u4e0a\uff09\uff0c\u8fd9\u4f7f\u5f97\u8fd9\u4e2a\u73af\u5883\u975e\u5e38\u9002\u5408LLM\u5229\u7528\u5176\u9884\u8bad\u7ec3\u7684\u5e38\u8bc6\u77e5\u8bc6\u3002\u4e3a\u4e86\u63d0\u793aReAct\uff0c\u6211\u4eec\u968f\u673a\u6ce8\u91ca\u4e86\u6bcf\u79cd\u4efb\u52a1\u7c7b\u578b\u7684\u8bad\u7ec3\u96c6\u4e2d\u7684\u4e09\u6761\u8f68\u8ff9\uff0c\u6bcf\u6761\u8f68\u8ff9\u5305\u62ec\u7a00\u758f\u7684\u60f3\u6cd5\uff0c\u8fd9\u4e9b\u60f3\u6cd5\uff081\uff09\u5206\u89e3\u76ee\u6807\uff0c\uff082\uff09\u8ddf\u8e2a\u5b50\u76ee\u6807\u5b8c\u6210\u60c5\u51b5\uff0c\uff083\uff09\u786e\u5b9
a\u4e0b\u4e00\u4e2a\u5b50\u76ee\u6807\uff0c\u4ee5\u53ca\uff084\uff09\u901a\u8fc7\u5e38\u8bc6\u63a8\u7406\u627e\u5230\u7269\u4f53\u7684\u4f4d\u7f6e\u4ee5\u53ca\u5982\u4f55\u5904\u7406\u5b83\u3002\u6211\u4eec\u5728\u9644\u5f55C.4\u4e2d\u5c55\u793a\u4e86\u7528\u4e8eALFWorld\u7684\u63d0\u793a\u3002\u9075\u5faaShridhar\u7b49\u4eba\u7684\u65b9\u6cd5\uff0c\u6211\u4eec\u5728\u7279\u5b9a\u4efb\u52a1\u8bbe\u7f6e\u4e2d\u8bc4\u4f30\u4e86134\u4e2a\u672a\u89c1\u8fc7\u7684\u8bc4\u4f30\u6e38\u620f\u3002\u4e3a\u4e86\u7a33\u5065\u6027\uff0c\u6211\u4eec\u901a\u8fc7\u6211\u4eec\u6ce8\u91ca\u76843\u6761\u8f68\u8ff9\u4e2d\u7684\u6bcf\u4e24\u6761\u8f68\u8ff9\u7684\u6bcf\u79cd\u6392\u5217\uff0c\u4e3a\u6bcf\u79cd\u4efb\u52a1\u7c7b\u578b\u6784\u5efa\u4e866\u4e2a\u63d0\u793a\u3002Act\u63d0\u793a\u662f\u4f7f\u7528\u76f8\u540c\u7684\u8f68\u8ff9\u6784\u5efa\u7684\uff0c\u4f46\u6ca1\u6709\u60f3\u6cd5\u2014\u2014\u56e0\u4e3a\u4efb\u52a1\u5b9e\u4f8b\u662f\u4ece\u8bad\u7ec3\u96c6\u4e2d\u968f\u673a\u9009\u62e9\u7684\uff0c\u6240\u4ee5\u65e2\u4e0d\u504f\u5411ReAct\u4e5f\u4e0d\u504f\u5411Act\uff0c\u63d0\u4f9b\u4e86\u4e00\u4e2a\u516c\u5e73\u548c\u53d7\u63a7\u7684\u6bd4\u8f83\uff0c\u4ee5\u6d4b\u8bd5\u7a00\u758f\u60f3\u6cd5\u7684\u91cd\u8981\u6027\u3002\u4f5c\u4e3a\u57fa\u7ebf\uff0c\u6211\u4eec\u4f7f\u7528BUTLER\uff0c\u8fd9\u662f\u4e00\u4e2a\u5728\u6bcf\u79cd\u4efb\u52a1\u7c7b\u578b\u7684105\u4e2a\u4e13\u5bb6\u8f68\u8ff9\u4e0a\u8bad\u7ec3\u7684\u6a21\u4eff\u5b66\u4e60\u667a\u80fd\u4f53\u3002<\/p>\n<p>&nbsp;<\/p>\n<p><strong>WebShop<\/strong> 
ReAct\u662f\u5426\u4e5f\u80fd\u4e0e\u5608\u6742\u7684\u5b9e\u9645\u8bed\u8a00\u73af\u5883\u8fdb\u884c\u4ea4\u4e92\uff0c\u7528\u4e8e\u5b9e\u9645\u5e94\u7528\uff1f\u6211\u4eec\u7814\u7a76\u4e86WebShop\uff0c\u8fd9\u662f\u4e00\u4e2a\u6700\u8fd1\u63d0\u51fa\u7684\u5728\u7ebf\u8d2d\u7269\u7f51\u7ad9\u73af\u5883\uff0c\u62e5\u6709118\u4e07\u771f\u5b9e\u4e16\u754c\u4ea7\u54c1\u548c12k\u4eba\u7c7b\u6307\u4ee4\u3002\u4e0eALFWorld\u4e0d\u540c\uff0cWebshop\u5305\u542b\u5927\u91cf\u7ed3\u6784\u5316\u548c\u975e\u7ed3\u6784\u5316\u7684\u6587\u672c\uff08\u4f8b\u5982\uff0c\u4ece\u4e9a\u9a6c\u900a\u6293\u53d6\u7684\u4ea7\u54c1\u6807\u9898\u3001\u63cf\u8ff0\u548c\u9009\u9879\uff09\uff0c\u5e76\u8981\u6c42\u667a\u80fd\u4f53\u6839\u636e\u7528\u6237\u6307\u4ee4\uff08\u4f8b\u5982\uff0c\u201c\u6211\u6b63\u5728\u5bfb\u627e\u4e00\u4e2a\u5e26\u62bd\u5c49\u7684\u5e8a\u5934\u67dc\u3002\u5b83\u5e94\u8be5\u6709\u954d\u8272\u7684\u5916\u89c2\uff0c\u4ef7\u683c\u4f4e\u4e8e140\u7f8e\u5143\u201d\uff09\u901a\u8fc7\u7f51\u7edc\u4ea4\u4e92\uff08\u4f8b\u5982\uff0c\u641c\u7d22\u201c\u5e8a\u5934\u67dc\u62bd\u5c49\u201d\uff0c\u9009\u62e9\u201c\u989c\u8272\uff1a\u73b0\u4ee3\u954d\u767d\u8272\u201d\u6216\u201c\u8fd4\u56de\u641c\u7d22\u201d\u7b49\u6309\u94ae\uff09\u8d2d\u4e70\u4ea7\u54c1\u3002\u8fd9\u4e2a\u4efb\u52a1\u901a\u8fc7\u5e73\u5747\u5f97\u5206\uff08\u6240\u9009\u4ea7\u54c1\u8986\u76d6\u6240\u9700\u5c5e\u6027\u7684\u767e\u5206\u6bd4\uff0c\u8de8\u6240\u6709\u56de\u5408\u5e73\u5747\uff09\u548c\u6210\u529f\u7387\uff08\u6240\u9009\u4ea7\u54c1\u6ee1\u8db3\u6240\u6709\u8981\u6c42\u7684\u56de\u5408\u767e\u5206\u6bd4\uff09\u5728500\u4e2a\u6d4b\u8bd5\u6307\u4ee4\u4e0a\u8fdb\u884c\u8bc4\u4f30\u3002\u6211\u4eec\u5236\u5b9a\u4e86Act\u63d0\u793a\uff0c\u5305\u62ec\u641c\u7d22\u3001\u9009\u62e9\u4ea7\u54c1\u3001\u9009\u62e9\u9009\u9879\u548c\u8d2d\u4e70\u7684\u884c\u52a8\uff0c\u800cReAct\u63d0\u793a\u5219\u989d\u5916\u63a8\u7406\u4ee5\u786e\u5b9a\u63a2\u7d22\u4ec0\u4e48\u3001\u4f55\u65f6\u8d2d\u4e70\uff0c\u4ee5\u53ca\u5
4ea\u4e9b\u4ea7\u54c1\u9009\u9879\u4e0e\u6307\u4ee4\u76f8\u5173\u3002\u53c2\u89c1\u88686\u7684\u793a\u4f8b\u63d0\u793a\uff0c\u4ee5\u53ca\u9644\u5f55\u4e2d\u7684\u886810\u7684\u6a21\u578b\u9884\u6d4b\u3002\u6211\u4eec\u5c06\u5176\u4e0e\u4e00\u4e2a\u901a\u8fc71012\u4e2a\u4eba\u6ce8\u91ca\u8f68\u8ff9\u8bad\u7ec3\u7684\u6a21\u4eff\u5b66\u4e60\u65b9\u6cd5\uff0c\u4ee5\u53ca\u4e00\u4e2a\u989d\u5916\u901a\u8fc710587\u4e2a\u8bad\u7ec3\u6307\u4ee4\u8bad\u7ec3\u7684\u6a21\u4eff+\u5f3a\u5316\u5b66\u4e60\u65b9\u6cd5\uff08IL + RL\uff09\u8fdb\u884c\u6bd4\u8f83\u3002<\/p>\n<p>&nbsp;<\/p>\n<p><strong>\u7ed3\u679c<\/strong> ReAct\u5728ALFWorld\uff08\u88683\uff09\u548cWebshop\uff08\u88684\uff09\u4e24\u4e2a\u5e73\u53f0\u4e0a\u90fd\u8d85\u8d8a\u4e86Act\u3002\u5728ALFWorld\u4e0a\uff0c\u8868\u73b0\u6700\u4f18\u79c0\u7684ReAct\u5b9e\u9a8c\u5e73\u5747\u6210\u529f\u7387\u8fbe\u523071%\uff0c\u5927\u5927\u8d85\u51fa\u6700\u597d\u7684Act\uff0845%\uff09\u548cBUTLER\uff0837%\uff09\u5b9e\u9a8c\u3002\u5b9e\u9645\u4e0a\uff0c\u8868\u73b0\u6700\u5dee\u7684ReAct\u5b9e\u9a8c\uff0848%\uff09\u4e5f\u8d85\u8fc7\u4e86\u8fd9\u4e24\u79cd\u65b9\u6cd5\u7684\u6700\u4f73\u5b9e\u9a8c\u3002\u6b64\u5916\uff0cReAct\u76f8\u5bf9Act\u7684\u4f18\u52bf\u5728\u516d\u6b21\u53d7\u63a7\u8bd5\u9a8c\u4e2d\u6301\u7eed\u5b58\u5728\uff0c\u76f8\u5bf9\u6027\u80fd\u63d0\u5347\u8303\u56f4\u4ece33%\u523090%\uff0c\u5e73\u5747\u4e3a62%\u3002\u4ece\u5b9a\u6027\u89d2\u5ea6\u6765\u770b\uff0c\u6211\u4eec\u53d1\u73b0Act\u5728\u5b8c\u5168\u6ca1\u6709\u601d\u8003\u7684\u60c5\u51b5\u4e0b\uff0c\u65e0\u6cd5\u6b63\u786e\u5c06\u76ee\u6807\u5206\u89e3\u6210\u66f4\u5c0f\u7684\u5b50\u76ee\u6807\uff0c\u6216\u8005\u5931\u53bb\u4e86\u5bf9\u73af\u5883\u5f53\u524d\u72b6\u6001\u7684\u8ddf\u8e2a\u3002\u53ef\u4ee5\u5728\u9644\u5f55D.2.1\u548c\u9644\u5f55D.2.2\u4e2d\u627e\u5230\u6bd4\u8f83ReAct\u548cAct\u7684\u4f8b\u5b50\u8f68\u8ff9\u3002<\/p>\n<p>&nbsp;<\/p>\n<div style=\"width: 1092px\" class=\"wp-caption aligncenter\"><img loading=\"lazy\" decoding=\"async\" 
class=\"aligncenter size-full wp-image-2607\" title=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-1\" src=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/e2bf752b22c928e.png\" alt=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-1\" width=\"1082\" height=\"390\" srcset=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/e2bf752b22c928e.png 1082w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/e2bf752b22c928e-300x108.png 300w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/e2bf752b22c928e-1024x369.png 1024w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/e2bf752b22c928e-768x277.png 768w\" sizes=\"auto, (max-width: 1082px) 100vw, 1082px\" \/><p class=\"wp-caption-text\">\u88683\uff1aAlfWorld\u4efb\u52a1\u7279\u5b9a\u6210\u529f\u7387\uff08%\uff09\u3002 BUTLER\u548cBUTLERg\u7684\u7ed3\u679c\u6765\u81eaShridhar\u7b49\u4eba\u76842020b\u88684\u3002\u6240\u6709\u65b9\u6cd5\u90fd\u4f7f\u7528\u8d2a\u5a6a\u89e3\u7801\uff0c\u9664\u4e86BUTLER\u4f7f\u7528\u6ce2\u675f\u641c\u7d22\u3002<\/p><\/div>\n<p>&nbsp;<\/p>\n<div style=\"width: 469px\" class=\"wp-caption aligncenter\"><img loading=\"lazy\" decoding=\"async\" class=\"aligncenter size-full wp-image-2532\" title=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-7\" src=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/59dcc4f00aa4b31.png\" alt=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-7\" width=\"459\" height=\"435\" srcset=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/59dcc4f00aa4b31.png 459w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/59dcc4f00aa4b31-300x284.png 300w\" sizes=\"auto, (max-width: 459px) 100vw, 459px\" \/><p 
class=\"wp-caption-text\">\u88684\uff1a\u5728Webshop\u4e0a\u7684\u5f97\u5206\u548c\u6210\u529f\u7387\uff08SR\uff09\u3002 IL\/IL+RL\u7684\u6570\u636e\u53d6\u81eaYao\u7b49\u4eba\uff082022\u5e74\uff09\u3002<\/p><\/div>\n<p>&nbsp;<\/p>\n<p>\u5728Webshop\u4e0a\uff0c\u4e00\u6b21\u6027\u7684Act\u63d0\u793a\u5df2\u7ecf\u80fd\u4e0eIL\u548cIL+RL\u65b9\u6cd5\u5e76\u9a7e\u9f50\u9a71\u3002\u901a\u8fc7\u989d\u5916\u7684\u7a00\u758f\u63a8\u7406\uff0cReAct\u5b9e\u73b0\u4e86\u660e\u663e\u66f4\u597d\u7684\u6027\u80fd\uff0c\u7edd\u5bf9\u503c\u63d0\u5347\u4e8610%\uff0c\u8d85\u8fc7\u4e86\u4e4b\u524d\u7684\u6700\u4f73\u6210\u529f\u7387\u3002\u901a\u8fc7\u68c0\u67e5\u793a\u4f8b\uff0c\u6211\u4eec\u53d1\u73b0ReAct\u66f4\u53ef\u80fd\u901a\u8fc7\u63a8\u7406\u6765\u786e\u5b9a\u4e0e\u6307\u4ee4\u76f8\u5173\u7684\u4ea7\u54c1\u548c\u9009\u9879\uff0c\u4ee5\u5f25\u8865\u5608\u6742\u89c2\u5bdf\u548c\u884c\u52a8\u4e4b\u95f4\u7684\u5dee\u8ddd\uff08\u4f8b\u5982\uff0c\u201c\u5bf9\u4e8e\u2018\u8282\u7701\u7a7a\u95f4\u7684\u751f\u6d3b\u5ba4\u811a\u51f3\u51f3\u5b50\u2019\uff0c\u8be5\u5546\u54c1\u6709\u201839x18x18inch\u2019\u548c\u2018\u84dd\u8272\u2019\u7684\u9009\u9879\uff0c\u770b\u8d77\u6765\u5f88\u503c\u5f97\u8d2d\u4e70\u3002\u201d\uff09\u3002\u7136\u800c\uff0c\u73b0\u6709\u65b9\u6cd5\u7684\u6027\u80fd\u4ecd\u8fdc\u4e0d\u53ca\u4e13\u5bb6\u4eba\u7c7b\uff08\u88684\uff09\uff0c\u4ed6\u4eec\u8fdb\u884c\u7684\u4ea7\u54c1\u63a2\u7d22\u548c\u67e5\u8be2\u91cd\u65b0\u6784\u5efa\u7684\u6570\u91cf\u660e\u663e\u66f4\u591a\uff0c\u5bf9\u4e8e\u57fa\u4e8e\u63d0\u793a\u7684\u65b9\u6cd5\u6765\u8bf4\uff0c\u8fd9\u4ecd\u7136\u662f\u4e00\u4e2a\u6311\u6218\u3002<\/p>\n<p>&nbsp;<\/p>\n<p><strong>\u5173\u4e8e\u5185\u90e8\u63a8\u7406\u4e0e\u5916\u90e8\u53cd\u9988\u7684\u4ef7\u503c<\/strong> 
\u636e\u6211\u4eec\u6240\u77e5\uff0cReAct\u662f\u7b2c\u4e00\u4e2a\u5c06LLM\u5e94\u7528\u4e8e\u4ea4\u4e92\u5f0f\u73af\u5883\u4e2d\u7684\u95ed\u73af\u7cfb\u7edf\u4e2d\uff0c\u7ed3\u5408\u63a8\u7406\u548c\u884c\u52a8\u7684\u6f14\u793a\u3002\u4e5f\u8bb8\u6700\u63a5\u8fd1\u7684\u5148\u524d\u5de5\u4f5c\u662f\u5185\u90e8\u72ec\u767d\uff08IM\uff09\uff0c\u6765\u81eaHuang\u7b49\u4eba\uff082022b\uff09\uff0c\u5176\u4e2d\u4f53\u73b0\u6027\u4ee3\u7406\u7684\u884c\u52a8\u662f\u7531\u540c\u540d\u7684\u201c\u5185\u90e8\u72ec\u767d\u201d\u6240\u9a71\u52a8\u7684\u3002<strong>\u7136\u800c\uff0cIM\u7684\u201c\u5185\u90e8\u72ec\u767d\u201d\u4ec5\u9650\u4e8e\u5bf9\u73af\u5883\u72b6\u6001\u7684\u89c2\u5bdf\u4ee5\u53ca\u4ee3\u7406\u9700\u8981\u5b8c\u6210\u7684\u4efb\u52a1\uff0c\u4ee5\u6ee1\u8db3\u76ee\u6807\u3002<\/strong>\u76f8\u6bd4\u4e4b\u4e0b\uff0cReAct\u4e2d\u7684\u51b3\u7b56\u63a8\u7406\u8ffd\u8e2a\u662f\u7075\u6d3b\u548c\u7a00\u758f\u7684\uff0c\u5141\u8bb8\u4e3a\u4e0d\u540c\u4efb\u52a1\u8bf1\u5bfc\u51fa\u591a\u6837\u5316\u7684\u63a8\u7406\u7c7b\u578b\uff08\u89c1\u7b2c2\u8282\uff09\u3002<\/p>\n<p>\u4e3a\u4e86\u5c55\u793aReAct\u548cIM\u4e4b\u95f4\u7684\u533a\u522b\uff0c\u5e76\u5f3a\u8c03\u5185\u90e8\u63a8\u7406\u4e0e\u7b80\u5355\u5bf9\u5916\u90e8\u53cd\u9988\u7684\u53cd\u5e94\u7684\u91cd\u8981\u6027\uff0c\u6211\u4eec\u4f7f\u7528\u7531IM\u98ce\u683c\u7684\u5bc6\u96c6\u5916\u90e8\u53cd\u9988\u7ec4\u6210\u7684\u601d\u7ef4\u6a21\u5f0f\u8fdb\u884c\u4e86\u6d88\u878d\u5b9e\u9a8c\u3002\u5982\u88683\u6240\u793a\uff0cReAct\u5927\u5927\u4f18\u4e8eIM\u98ce\u683c\u7684\u63d0\u793a\uff08ReAct-IM\uff09\uff0871%\u5bf9\u6bd453%\u7684\u6574\u4f53\u6210\u529f\u7387\uff09\uff0c\u5728\u516d\u9879\u4efb\u52a1\u4e2d\u7684\u4e94\u9879\u4e0a\u90fd\u6709\u4e00\u81f4\u7684\u4f18\u52bf\u3002\u4ece\u5b9a\u6027\u89d2\u5ea6\u6765\u770b\uff0c\u6211\u4eec\u89c2\u5bdf\u5230ReAct-IM\u5728\u786e\u5b9a\u5b50\u76ee\u6807\u4f55\u65f6\u5b8c\u6210\uff0c\u6216\u8005\u4e0b\u4e00\u4e2a\u5b50\u76ee\u6807\u5e94\u8be5\u662f\u4ec0\u4e48\u65f6\u7
ecf\u5e38\u72af\u9519\u8bef\uff0c\u56e0\u4e3a\u7f3a\u4e4f\u9ad8\u5c42\u6b21\u7684\u76ee\u6807\u5206\u89e3\u3002\u6b64\u5916\uff0c\u8bb8\u591aReAct-IM\u8f68\u8ff9\u5728\u786e\u5b9aALFWorld\u73af\u5883\u4e2d\u7269\u54c1\u53ef\u80fd\u7684\u4f4d\u7f6e\u65f6\u4e5f\u9047\u5230\u4e86\u56f0\u96be\uff0c\u56e0\u4e3a\u7f3a\u4e4f\u5e38\u8bc6\u63a8\u7406\u3002<br \/>\n\u8fd9\u4e24\u79cd\u4e0d\u8db3\u90fd\u53ef\u4ee5\u5728ReAct\u8303\u5f0f\u4e2d\u5f97\u5230\u89e3\u51b3\u3002\u5173\u4e8eReAct-IM\u7684\u66f4\u591a\u7ec6\u8282\u5728\u9644\u5f55B.2\u4e2d\u3002ReAct-IM\u7684\u793a\u4f8b\u63d0\u793a\u53ef\u4ee5\u5728\u9644\u5f55C.4\u4e2d\u627e\u5230\uff0c\u793a\u4f8b\u8f68\u8ff9\u5728\u9644\u5f55D.2.3\u4e2d\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>&nbsp;<\/p>\n<h2>\u00a05 \u76f8\u5173\u5de5\u4f5c<\/h2>\n<p>&nbsp;<\/p>\n<p><strong>\u63a8\u7406\u7684\u8bed\u8a00\u6a21\u578b<\/strong> \u4e5f\u8bb8\u6700\u4e3a\u4eba\u6240\u77e5\u7684\u4f7f\u7528\u5927\u578b\u8bed\u8a00\u6a21\u578b\uff08LLMs\uff09\u8fdb\u884c\u63a8\u7406\u7684\u5de5\u4f5c\u662fChain-of-Thought (CoT)\uff0c\u5b83\u63ed\u793a\u4e86LLMs\u5236\u5b9a\u81ea\u5df1\u7684\u201c\u601d\u8003\u8fc7\u7a0b\u201d\u6765\u89e3\u51b3\u95ee\u9898\u7684\u80fd\u529b\u3002\u6b64\u540e\u5df2\u7ecf\u8fdb\u884c\u4e86\u51e0\u9879\u540e\u7eed\u5de5\u4f5c\uff0c\u5305\u62ec\u7528\u4e8e\u89e3\u51b3\u590d\u6742\u4efb\u52a1\u7684\u6700\u5c11\u81f3\u6700\u591a\u63d0\u793a\uff08least-to-most prompting\uff09\u3001\u96f6\u6837\u672cCoT\uff08zero-shotCoT\uff09\u4ee5\u53ca\u81ea\u6211\u4e00\u81f4\u6027\u63a8\u7406\uff08self-consistency\uff09\u3002\u6700\u8fd1\uff0c(Madaan &amp; Yazdanbakhsh\uff0c2022)\u7cfb\u7edf\u5730\u7814\u7a76\u4e86CoT\u7684\u6784\u5efa\u548c\u7ed3\u6784\uff0c\u5e76\u89c2\u5bdf\u5230\u7b26\u53f7\u3001\u6a21\u5f0f\u548c\u6587\u672c\u7684\u5b58\u5728\u5bf9CoT\u7684\u6709\u6548\u6027\u81f3\u5173\u91cd\u8981\u3002<br 
\/>\n\u5176\u4ed6\u5de5\u4f5c\u4e5f\u5df2\u7ecf\u6269\u5c55\u5230\u4e86\u66f4\u590d\u6742\u7684\u63a8\u7406\u67b6\u6784\uff0c\u4e0d\u4ec5\u4ec5\u662f\u7b80\u5355\u7684\u63d0\u793a\u3002\u4f8b\u5982\uff0c\u9009\u62e9-\u63a8\u7406\uff08Selection-Inference\uff09\u5c06\u63a8\u7406\u8fc7\u7a0b\u5206\u4e3a\u201c\u9009\u62e9\u201d\u548c\u201c\u63a8\u7406\u201d\u4e24\u4e2a\u6b65\u9aa4\u3002STaR\u901a\u8fc7\u5728\u6a21\u578b\u81ea\u8eab\u751f\u6210\u7684\u6b63\u786e\u63a8\u7406\u57fa\u7840\u4e0a\u5bf9\u6a21\u578b\u8fdb\u884c\u5fae\u8c03\u6765\u5f15\u5bfc\u63a8\u7406\u8fc7\u7a0b\u3002\u5fe0\u5b9e\u63a8\u7406\uff08Faithful reasoning\uff09\u5c06\u591a\u6b65\u9aa4\u63a8\u7406\u5206\u89e3\u4e3a\u4e09\u4e2a\u6b65\u9aa4\uff0c\u6bcf\u4e2a\u6b65\u9aa4\u7531\u4e00\u4e2a\u4e13\u95e8\u7684LM\u5206\u522b\u6267\u884c\u3002\u7c7b\u4f3c\u7684\u65b9\u6cd5\uff0c\u5982Scratchpad\uff0c\u901a\u8fc7\u5728\u4e2d\u95f4\u8ba1\u7b97\u6b65\u9aa4\u4e0a\u5bf9LM\u8fdb\u884c\u5fae\u8c03\uff0c\u4e5f\u5c55\u793a\u4e86\u5728\u591a\u6b65\u9aa4\u8ba1\u7b97\u95ee\u9898\u4e0a\u7684\u6539\u8fdb\u3002<br \/>\n\u4e0e\u8fd9\u4e9b\u65b9\u6cd5\u76f8\u6bd4\uff0cReAct\u6267\u884c\u7684\u4e0d\u4ec5\u4ec5\u662f\u5b64\u7acb\u7684\u3001\u56fa\u5b9a\u7684\u63a8\u7406\uff0c\u5e76\u5c06\u6a21\u578b\u52a8\u4f5c\u53ca\u5176\u5bf9\u5e94\u7684\u89c2\u5bdf\u7ed3\u679c\u6574\u5408\u5230\u4e00\u4e2a\u8fde\u8d2f\u7684\u8f93\u5165\u6d41\u4e2d\uff0c\u4ee5\u4fbf\u6a21\u578b\u66f4\u51c6\u786e\u5730\u8fdb\u884c\u63a8\u7406\uff0c\u5e76\u89e3\u51b3\u8d85\u8d8a\u63a8\u7406\u7684\u4efb\u52a1\uff08\u4f8b\u5982\u4ea4\u4e92\u5f0f\u51b3\u7b56\u5236\u5b9a\uff09\u3002<\/p>\n<p>&nbsp;<\/p>\n<p><strong>\u5c06\u8bed\u8a00\u6a21\u578b\u7528\u4e8e\u51b3\u7b56\u5236\u5b9a\u3002<\/strong> 
\u5f3a\u5927\u7684LLM\u7684\u80fd\u529b\u4f7f\u5b83\u4eec\u80fd\u591f\u6267\u884c\u8d85\u8d8a\u8bed\u8a00\u751f\u6210\u7684\u4efb\u52a1\uff0c\u5229\u7528LLM\u4f5c\u4e3a\u51b3\u7b56\u5236\u5b9a\u7684\u7b56\u7565\u6a21\u578b\uff0c\u7279\u522b\u662f\u5728\u4ea4\u4e92\u73af\u5883\u4e2d\uff0c\u8fd9\u8d8a\u6765\u8d8a\u53d7\u6b22\u8fce\u3002WebGPT\u4f7f\u7528LM\u4e0e\u7f51\u9875\u6d4f\u89c8\u5668\u8fdb\u884c\u4ea4\u4e92\uff0c\u5bfc\u822a\u7f51\u9875\uff0c\u5e76\u4eceELI5\u4e2d\u63a8\u65ad\u51fa\u5bf9\u590d\u6742\u95ee\u9898\u7684\u7b54\u6848\u3002\u4e0eReAct\u76f8\u6bd4\uff0cWebGPT\u5e76\u672a\u660e\u786e\u5efa\u6a21\u601d\u8003\u548c\u63a8\u7406\u8fc7\u7a0b\uff0c\u800c\u662f\u4f9d\u8d56\u4e8e\u6602\u8d35\u7684\u4eba\u7c7b\u53cd\u9988\u8fdb\u884c\u5f3a\u5316\u5b66\u4e60\u3002\u5728\u5bf9\u8bdd\u5efa\u6a21\u4e2d\uff0c\u50cfBlenderBot\u548cSparrow\u4ee5\u53ca\u9762\u5411\u4efb\u52a1\u7684\u5bf9\u8bdd\u7cfb\u7edf\u5982SimpleTOD\u4e5f\u8bad\u7ec3LM\u6765\u505a\u51fa\u5173\u4e8eAPI\u8c03\u7528\u7684\u51b3\u7b56\u3002\u4e0eReAct\u4e0d\u540c\uff0c\u5b83\u4eec\u6ca1\u6709\u660e\u786e\u8003\u8651\u63a8\u7406\u8fc7\u7a0b\uff0c\u5e76\u4f9d\u8d56\u4e8e\u6602\u8d35\u7684\u6570\u636e\u96c6\u548c\u4eba\u7c7b\u53cd\u9988\u96c6\u5408\u8fdb\u884c\u7b56\u7565\u5b66\u4e60\u3002\u76f8\u53cd\uff0cReAct\u4ee5\u4e00\u79cd\u66f4\u4fbf\u5b9c\u7684\u65b9\u5f0f\u5b66\u4e60\u7b56\u7565\uff0c\u56e0\u4e3a\u51b3\u7b56\u5236\u5b9a\u8fc7\u7a0b\u53ea\u9700\u8981\u8bed\u8a00\u63cf\u8ff0\u63a8\u7406\u8fc7\u7a0b\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>\u8bed\u8a00\u6a21\u578b\uff08LLMs\uff09\u4e5f\u8d8a\u6765\u8d8a\u591a\u5730\u88ab\u5e94\u7528\u4e8e\u4ea4\u4e92\u5f0f\u548c\u5177\u8eab\u73af\u5883\u4e2d\u7684\u89c4\u5212\u548c\u51b3\u7b56\u3002\u5728\u8fd9\u65b9\u9762\uff0c\u4e0eReAct\u6700\u4e3a\u76f8\u5173\u7684\u53ef\u80fd\u662fSayCan\u548c<strong>Inner 
Monologue\uff08\u5185\u5fc3\u72ec\u767d\uff09<\/strong>\uff0c\u5b83\u4eec\u4f7f\u7528LLMs\u8fdb\u884c\u673a\u5668\u4eba\u7684\u52a8\u4f5c\u89c4\u5212\u548c\u51b3\u7b56\u3002\u5728SayCan\u4e2d\uff0cLLMs\u88ab\u63d0\u793a\u76f4\u63a5\u9884\u6d4b\u673a\u5668\u4eba\u53ef\u80fd\u91c7\u53d6\u7684\u884c\u52a8\uff0c\u7136\u540e\u7531\u57fa\u4e8e\u89c6\u89c9\u73af\u5883\u7684\u53ef\u4f9b\u6027\u6a21\u578b\u91cd\u65b0\u6392\u5e8f\u4ee5\u8fdb\u884c\u6700\u7ec8\u9884\u6d4b\u3002Inner Monologue\u901a\u8fc7\u6dfb\u52a0\u8457\u540d\u7684\u201c\u5185\u5fc3\u72ec\u767d\u201d\u8fdb\u4e00\u6b65\u6539\u8fdb\uff0c\u8be5\u72ec\u767d\u88ab\u5b9e\u73b0\u4e3a\u4ece\u73af\u5883\u4e2d\u6ce8\u5165\u7684\u53cd\u9988\u3002\u636e\u6211\u4eec\u6240\u77e5\uff0cInner Monologue\u662f\u7b2c\u4e00\u4e2a\u5c55\u793a\u8fd9\u79cd\u95ed\u73af\u7cfb\u7edf\u7684\u5de5\u4f5c\uff0cReAct\u5728\u6b64\u57fa\u7840\u4e0a\u8fdb\u884c\u6784\u5efa\u3002\u7136\u800c\uff0c\u6211\u4eec\u8ba4\u4e3aInner Monologue\u5e76\u4e0d\u771f\u6b63\u5305\u542b\u5185\u5fc3\u601d\u7ef4\u2014\u2014\u8fd9\u5728\u7b2c4\u8282\u4e2d\u6709\u8be6\u7ec6\u9610\u8ff0\u3002\u6211\u4eec\u8fd8\u6ce8\u610f\u5230\uff0c\u5728\u4ea4\u4e92\u5f0f\u51b3\u7b56\u8fc7\u7a0b\u4e2d\uff0c\u5c06\u8bed\u8a00\u4f5c\u4e3a\u8bed\u4e49\u4e30\u5bcc\u7684\u8f93\u5165\u5df2\u88ab\u8bc1\u660e\u5728\u5176\u4ed6\u8bbe\u7f6e\u4e0b\u662f\u6210\u529f\u7684\u3002\u8d8a\u6765\u8d8a\u660e\u663e\u7684\u662f\uff0c\u501f\u52a9LLMs\uff0c\u8bed\u8a00\u4f5c\u4e3a\u4e00\u79cd\u57fa\u672c\u7684\u8ba4\u77e5\u673a\u5236\u5c06\u5728\u4ea4\u4e92\u548c\u51b3\u7b56\u4e2d\u53d1\u6325\u5173\u952e\u4f5c\u7528\u3002\u6b64\u5916\uff0cLLMs\u7684\u8fdb\u6b65\u4e5f\u542f\u53d1\u4e86\u50cfReed\u7b49\u4eba\u8fd9\u6837\u591a\u529f\u80fd\u548c\u901a\u7528\u4ee3\u7406\u7684\u53d1\u5c55\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>&nbsp;<\/p>\n<h2>6 
\u7ed3\u8bba<\/h2>\n<p>&nbsp;<\/p>\n<p>\u6211\u4eec\u63d0\u51fa\u4e86ReAct\u2014\u2014\u4e00\u79cd\u7b80\u5355\u800c\u6709\u6548\u7684\u65b9\u6cd5\uff0c\u7528\u4e8e\u5728\u5927\u578b\u8bed\u8a00\u6a21\u578b\u4e2d\u534f\u8c03\u63a8\u7406\u548c\u884c\u52a8\u3002\u901a\u8fc7\u5728\u591a\u8df3\u95ee\u7b54\u3001\u4e8b\u5b9e\u67e5\u8bc1\u548c\u4ea4\u4e92\u5f0f\u51b3\u7b56\u4efb\u52a1\u4e0a\u7684\u4e00\u7cfb\u5217\u591a\u6837\u5316\u7684\u5b9e\u9a8c\uff0c\u6211\u4eec\u5c55\u793a\u4e86ReAct\u80fd\u591f\u5e26\u6765\u66f4\u4f18\u79c0\u7684\u6027\u80fd\u5e76\u5177\u6709\u53ef\u89e3\u91ca\u7684\u51b3\u7b56\u8def\u5f84\u3002\u5c3d\u7ba1\u6211\u4eec\u7684\u65b9\u6cd5\u5f88\u7b80\u5355\uff0c\u4f46\u662f\u5927\u578b\u884c\u52a8\u7a7a\u95f4\u7684\u590d\u6742\u4efb\u52a1\u9700\u8981\u66f4\u591a\u7684\u793a\u4f8b\u624d\u80fd\u5b66\u4e60\u5f97\u597d\uff0c\u8fd9\u5f88\u5bb9\u6613\u8d85\u51fa\u5728\u4e0a\u4e0b\u6587\u5b66\u4e60\u4e2d\u7684\u8f93\u5165\u957f\u5ea6\u9650\u5236\u3002\u6211\u4eec\u5728HotpotQA\u4e0a\u5c1d\u8bd5\u4e86\u5fae\u8c03\u7684\u65b9\u6cd5\uff0c\u521d\u6b65\u7ed3\u679c\u4ee4\u4eba\u9f13\u821e\uff0c\u4f46\u662f\u5728\u66f4\u591a\u9ad8\u8d28\u91cf\u4eba\u7c7b\u6ce8\u89e3\u4e2d\u5b66\u4e60\u5c06\u4f1a\u662f\u8fdb\u4e00\u6b65\u63d0\u9ad8\u6027\u80fd\u7684\u671f\u671b\u3002\u8ba9ReAct\u5728\u591a\u4efb\u52a1\u8bad\u7ec3\u4e2d\u6269\u5927\u89c4\u6a21\uff0c\u548c\u50cf\u5f3a\u5316\u5b66\u4e60\u8fd9\u6837\u7684\u4e92\u8865\u8303\u5f0f\u76f8\u7ed3\u5408\uff0c\u53ef\u80fd\u4f1a\u4ea7\u751f\u66f4\u5f3a\u5927\u7684\u4ee3\u7406\uff0c\u4e3a\u66f4\u591a\u7684\u5e94\u7528\u89e3\u9501LLMs\u7684\u6f5c\u529b\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>&nbsp;<\/p>\n<h2>A \u9644\u52a0\u7ed3\u679c<\/h2>\n<p>&nbsp;<\/p>\n<h3>A.1 GPT-3 \u5b9e\u9a8c<\/h3>\n<div style=\"width: 600px\" class=\"wp-caption aligncenter\"><img loading=\"lazy\" decoding=\"async\" class=\"aligncenter size-full wp-image-2533\" title=\"ReAct: 
\u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-8\" src=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/fd479ea6fbef27a.png\" alt=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-8\" width=\"590\" height=\"128\" srcset=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/fd479ea6fbef27a.png 590w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/fd479ea6fbef27a-300x65.png 300w\" sizes=\"auto, (max-width: 590px) 100vw, 590px\" \/><p class=\"wp-caption-text\">\u88685\uff1a\u4f7f\u7528PaLM-540B\u4e0eGPT-3\uff08text-davinci-002\uff0c\u8d2a\u5a6a\u89e3\u7801\uff09\u8fdb\u884cReAct\u63d0\u793a\u7684\u7ed3\u679c\u5bf9\u6bd4\u3002 \u5728HotpotQA\u4e0a\uff0c\u6211\u4eec\u968f\u673a\u62bd\u53d6\u4e86500\u4e2a\u9a8c\u8bc1\u95ee\u9898\u7684\u5b50\u96c6\u3002\u5728ALFWorld\u4e2d\uff0c\u6211\u4eec\u4f7f\u7528\u4e86\u6240\u6709134\u4e2a\u672a\u89c1\u8fc7\u7684\u9a8c\u8bc1\u4efb\u52a1\u5b9e\u4f8b\uff0c\u5e76\u4f7f\u7528\u4e86\u6839\u636ePaLM-540B\u9009\u62e9\u7684\u6700\u4f73\u63d0\u793a\u96c6\u3002<\/p><\/div>\n<p>\u6211\u4eec\u8fdb\u884c\u4e86\u989d\u5916\u7684 GPT-3\uff08Brown \u7b49\u4eba\uff0c2020\uff09\u5b9e\u9a8c\uff0c\u4ee5\u786e\u8ba4ReAct \u63d0\u793a\u6027\u80fd\u5728\u4e0d\u540c\u5927\u578b\u8bed\u8a00\u6a21\u578b\u4e2d\u7684\u666e\u904d\u6027\u3002\u5982\u88685\u6240\u793a\uff0cGPT-3\uff08text-davinci-002\uff0cgreedy decoding\uff09\u5728 HotpotQA \u548c ALFWorld \u4e0a\u59cb\u7ec8\u4f18\u4e8e PaLM-540B\uff0c\u53ef\u80fd\u662f\u56e0\u4e3a\u5b83\u7ecf\u8fc7\u4e86\u9075\u5faa\u4eba\u7c7b\u6307\u4ee4\u7684\u5fae\u8c03\u3002\u8fd9\u8868\u660eReAct \u63d0\u793a\u5728\u4e0d\u540c\u4efb\u52a1\u4e0a\u5bf9\u4e0d\u540c\u7684\u5927\u578b\u8bed\u8a00\u6a21\u578b\u90fd\u662f\u6709\u6548\u7684\u3002\u8fd9\u4e9b\u5b9e\u9a8c\u7684\u4ee3\u7801\u53ef\u4ee5\u5728 https:\/\/react-lm.github.io\/ \u4e0a\u627e\u5230\u3002<\/p>\n<p>&nbsp;<\/p>\n<h3>A.2 ReAct \u5728 
HotpotQA \u4e0a\u83b7\u53d6\u6700\u65b0\u77e5\u8bc6<\/h3>\n<div style=\"width: 1588px\" class=\"wp-caption aligncenter\"><img loading=\"lazy\" decoding=\"async\" class=\"aligncenter size-full wp-image-2534\" title=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-9\" src=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/3be8e675de8f0da.png\" alt=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-9\" width=\"1578\" height=\"673\" srcset=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/3be8e675de8f0da.png 1578w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/3be8e675de8f0da-300x128.png 300w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/3be8e675de8f0da-1024x437.png 1024w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/3be8e675de8f0da-768x328.png 768w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/3be8e675de8f0da-1536x655.png 1536w\" sizes=\"auto, (max-width: 1578px) 100vw, 1578px\" \/><p class=\"wp-caption-text\">\u56fe 4\uff1a\u53e6\u4e00\u4e2a HotpotQA \u95ee\u9898\u793a\u4f8b\uff0c\u5176\u4e2d\u539f\u59cb\u6807\u7b7e\u5df2\u7ecf\u8fc7\u65f6\u3002\u53ea\u6709ReAct\u80fd\u591f\u901a\u8fc7\u5b9e\u9645\u7684\u7f51\u7edc\u4e92\u52a8\u52a0\u4e0a\u63a8\u7406\u83b7\u5f97\u6700\u65b0\u7684\u7b54\u6848\u3002<\/p><\/div>\n<p>&nbsp;<\/p>\n<h3>A.3 \u5728 ALFWorld \u4e0a\u8fdb\u884c\u4eba\u7c7b\u53c2\u4e0e\u5faa\u73af\u7684\u884c\u4e3a\u6821\u6b63<\/h3>\n<p>\u6211\u4eec\u8fd8\u63a2\u7d22\u4e86\u4e0e ReAct \u7684\u4eba\u7c7b\u53c2\u4e0e\u5faa\u73af\u4ea4\u4e92\uff0c\u5141\u8bb8\u4eba\u7c7b\u68c0\u67e5\u548c\u7f16\u8f91 ReAct \u7684\u63a8\u7406\u75d5\u8ff9\u3002\u56fe5\u663e\u793a\uff0c\u4ec5\u4ec5\u901a\u8fc7\u79fb\u9664 Act 17 \u4e2d\u7684\u4e00\u53e5\u5e7b\u89c9\u53e5\u5b50\u5e76\u5728 Act 23 \u4e2d\u6dfb\u52a0\u4e00\u4e9b\u63d0\u793a\uff0c\u5c31\u53ef\u4ee5\u4f7f ReAct 
\u663e\u8457\u6539\u53d8\u5176\u884c\u4e3a\uff0c\u4e0e\u8fd9\u4e9b\u4eba\u7c7b\u601d\u7ef4\u7f16\u8f91\u5bf9\u9f50\uff0c\u5e76\u6210\u529f\u5b8c\u6210\u4efb\u52a1\u3002\u4ece\u4eba\u7c7b\u7684\u89d2\u5ea6\u6765\u770b\uff0c\u89e3\u51b3\u8fd9\u6837\u7684\u4efb\u52a1\u53d8\u5f97\u5bb9\u6613\u5f97\u591a\uff0c\u4ece\u8f93\u5165\u6570\u5341\u4e2a\u52a8\u4f5c\u5230\u4ec5\u7f16\u8f91\u51e0\u4e2a\u60f3\u6cd5\uff0c\u8fd9\u4f7f\u5f97\u65b0\u578b\u7684\u4eba\u673a\u534f\u4f5c\u6210\u4e3a\u53ef\u80fd\u3002\u6211\u4eec\u6ce8\u610f\u5230\uff0c\u5bf9\u4e8e Act \u548c\u4ee5\u524d\u7684 RL \u65b9\u6cd5\u6765\u8bf4\uff0c\u8fd9\u6837\u7684\u7b56\u7565\u7f16\u8f91\u662f\u56f0\u96be\u7684\uff0c\u56e0\u4e3a\u4eba\u7c7b\u65e0\u6cd5\u6539\u53d8\u6a21\u578b\u53c2\u6570\uff0c\u800c\u4e14\u6539\u53d8\u51e0\u4e2a\u52a8\u4f5c\u53ef\u80fd\u4e0d\u4f1a\u7f16\u8f91\u6a21\u578b\u7684\u5176\u4f59\u884c\u4e3a\u3002\u8fd9\u79cd\u8303\u5f0f\u4e5f\u4e0d\u4ec5\u4ec5\u662f\u4eba\u7c7b\u5bf9\u8bdd\u6765\u66f4\u65b0\u76ee\u6807\u6216\u5b50\u76ee\u6807\uff0c\u5982 Huang \u7b49\u4eba\uff082022b\uff09\u6240\u8ff0\u2014\u2014\u867d\u7136\u7f16\u8f91 ReAct \u60f3\u6cd5\u53ef\u4ee5\u505a\u5230\u8fd9\u4e9b\uff0c\u4f46\u5b83\u8fd8\u53ef\u4ee5\u4fee\u6539\u6a21\u578b\u7684\u5185\u90e8\u4fe1\u5ff5\u3001\u63a8\u7406\u98ce\u683c\u6216\u7075\u6d3b\u7684\u601d\u60f3\u7a7a\u95f4\u652f\u6301\u7684\u4efb\u4f55\u5185\u5bb9\uff0c\u4ee5\u66f4\u597d\u5730\u89e3\u51b3\u4efb\u52a1\u3002\u6211\u4eec\u76f8\u4fe1\u8fd9\u662f\u4eba\u7c7b\u5bf9\u9f50\u7684\u4e00\u4e2a\u4ee4\u4eba\u5174\u594b\u7684\u65b9\u5411\uff0c\u5e76\u7559\u4e0b\u66f4\u7cfb\u7edf\u7684\u7814\u7a76\u4f5c\u4e3a\u672a\u6765\u5de5\u4f5c\u3002<\/p>\n<p>&nbsp;<\/p>\n<div style=\"width: 1630px\" class=\"wp-caption aligncenter\"><img loading=\"lazy\" decoding=\"async\" class=\"aligncenter size-full wp-image-2537\" title=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-10\" 
src=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/cc1c19d7cc31d3c.png\" alt=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-10\" width=\"1620\" height=\"635\" srcset=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/cc1c19d7cc31d3c.png 1620w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/cc1c19d7cc31d3c-300x118.png 300w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/cc1c19d7cc31d3c-1024x401.png 1024w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/cc1c19d7cc31d3c-768x301.png 768w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/cc1c19d7cc31d3c-1536x602.png 1536w\" sizes=\"auto, (max-width: 1620px) 100vw, 1620px\" \/><p class=\"wp-caption-text\">\u56fe 5\uff1a\u5728AlfWorld\u4e2d\u4f7f\u7528ReAct\u8fdb\u884c\u4eba\u673a\u4ea4\u4e92\u884c\u4e3a\u6821\u6b63\u7684\u793a\u4f8b\u3002 (a) \u7531\u4e8e\u5e7b\u89c9\u601d\u7ef4\uff08\u884c\u4e3a17\uff09\uff0cReAct\u8f68\u8ff9\u5931\u8d25\u3002 (b) \u901a\u8fc7\u7b80\u5355\u5730\u7531\u4eba\u7c7b\u7f16\u8f91\u4e24\u4e2a\u601d\u7ef4\uff08\u884c\u4e3a17, 23\uff09\uff0cReAct\u8f68\u8ff9\u4ea7\u751f\u4e86\u7406\u60f3\u7684\u63a8\u7406\u8f68\u8ff9\u548c\u884c\u52a8\uff0c\u5e76\u53d6\u5f97\u4e86\u6210\u529f\u3002<\/p><\/div>\n<p>&nbsp;<\/p>\n<p>&nbsp;<\/p>\n<h2>B \u5b9e\u9a8c\u7ec6\u8282<\/h2>\n<p>&nbsp;<\/p>\n<h3>B.1 
HotpotQA \u5fae\u8c03\u7ec6\u8282<\/h3>\n<p>\u5bf9\u4e8e\u6240\u6709\u7684\u5fae\u8c03\uff0c\u6211\u4eec\u4f7f\u752864\u7684\u6279\u5904\u7406\u5927\u5c0f\u3002\u5728PaLM-8B\u4e0a\uff0c\u6211\u4eec\u5bf9ReAct\u548cAct\u65b9\u6cd5\u8fdb\u884c4,000\u6b65\u7684\u5fae\u8c03\uff0c\u5bf9\u6807\u51c6\u548cCoT\u65b9\u6cd5\u8fdb\u884c2,000\u6b65\u7684\u5fae\u8c03\u3002\u5728PaLM-62B\u4e0a\uff0c\u6211\u4eec\u5bf9ReAct\u548cAct\u65b9\u6cd5\u8fdb\u884c4,000\u6b65\u7684\u5fae\u8c03\uff0c\u5bf9\u6807\u51c6\u548cCoT\u65b9\u6cd5\u8fdb\u884c1,000\u6b65\u7684\u5fae\u8c03\u3002\u6211\u4eec\u53d1\u73b0ReAct\u548cAct\u65b9\u6cd5\u901a\u5e38\u4ece\u66f4\u591a\u7684\u8bad\u7ec3\u6b65\u9aa4\uff08\u4ee5\u53ca\u66f4\u591a\u7684\u8bad\u7ec3\u6570\u636e\uff09\u4e2d\u53d7\u76ca\uff0c\u800c\u6807\u51c6\u548cCoT\u65b9\u6cd5\u5728\u5fae\u8c03\u540e\u5f88\u5feb\u5c31\u5f00\u59cb\u9000\u5316\u3002<\/p>\n<p>&nbsp;<\/p>\n<h3>B.2 ALFWORLD IM\u98ce\u683c\u7ec6\u8282<\/h3>\n<p>\u5bf9\u4e8eIM\u98ce\u683c\u7684\u6d88\u878d\u5b9e\u9a8c\uff0c\u4e0eReAct\u4e2d\u4f7f\u7528\u7684\u76f8\u540c\u7684\u4e13\u5bb6\u8f68\u8ff9\u88ab\u91cd\u65b0\u6ce8\u91ca\uff0c\u8fd9\u4e9b\u8f68\u8ff9\u5185\u90e8\u5305\u542b\u4e86\u5bc6\u96c6\u7684\u5916\u90e8\u53cd\u9988\u601d\u7ef4\uff0c\u8fd9\u4e9b\u53cd\u9988\u9650\u5236\u4e86ReAct-IM\u4ec5\u8003\u8651(1)\u5206\u89e3\u5f53\u524d\u76ee\u6807\u548c(2)\u9700\u8981\u5b8c\u6210\u7684\u5f53\u524d\u5b50\u76ee\u6807\u3002\u5177\u4f53\u6765\u8bf4\uff0cReAct-IM\u7f3a\u4e4f(1)\u786e\u5b9a\u5b50\u76ee\u6807\u4f55\u65f6\u5b8c\u6210\u7684\u601d\u8003(2)\u786e\u5b9a\u4e0b\u4e00\u4e2a\u5b50\u76ee\u6807\u5e94\u8be5\u662f\u4ec0\u4e48\u7684\u601d\u8003(3)\u8bf1\u5bfcLLM\u53c2\u8003\u5176\u5185\u90e8\u9884\u8bad\u7ec3\u77e5\u8bc6\u4ee5\u8bc6\u522b\u73af\u5883\u4e2d\u7269\u54c1\u53ef\u80fd\u7684\u4f4d\u7f6e\u7684\u601d\u8003\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>&nbsp;<\/p>\n<h2>C PROMPTS<\/h2>\n<p>&nbsp;<\/p>\n<h3>C.1 
HotpotQA<\/h3>\n<p>HotpotQA \u63d0\u793a<\/p>\n<table width=\"950\">\n<tbody>\n<tr>\n<td colspan=\"2\" width=\"950\">Original<\/td>\n<\/tr>\n<tr>\n<td>Question<\/td>\n<td>Answer<\/td>\n<\/tr>\n<tr>\n<td>What&#8217;s the elevation range for the area that the eastern sector of the Colorado orogeny extends into?<\/td>\n<td>1,800 to 7,000 ft<\/td>\n<\/tr>\n<tr>\n<td>Musician and satirist Allie Goertz wrote a song about &#8220;The Simpsons&#8221; <a href=\"https:\/\/www.kdjingpai.com\/en\/character-ai\/\">character<\/a> Milhouse, who Matt Groening named after who?<\/td>\n<td>Richard Nixon<\/td>\n<\/tr>\n<tr>\n<td>Which documentary is about Finnish rock groups, Adam Clayton Powell, or The Saimaa Gesture?<\/td>\n<td>The Saimaa Gesture<\/td>\n<\/tr>\n<tr>\n<td>What profession do Nicholas Ray and Elia Kazan have in common?<\/td>\n<td>Director, screenwriter, actor<\/td>\n<\/tr>\n<tr>\n<td>Which magazine was started first, Arthur&#8217;s Magazine or First for Women?<\/td>\n<td>Arthur&#8217;s Magazine<\/td>\n<\/tr>\n<tr>\n<td>Are Pavel Urysohn and Leonid Levin known for the same type of work?<\/td>\n<td>Yes<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<table width=\"442\">\n<tbody>\n<tr>\n<td colspan=\"2\" width=\"442\">Original<\/td>\n<\/tr>\n<tr>\n<td>\u95ee\u9898<\/td>\n<td>\u7b54\u6848<\/td>\n<\/tr>\n<tr>\n<td>\u79d1\u7f57\u62c9\u591a\u9020\u5c71\u8fd0\u52a8\u4e1c\u6bb5\u5ef6\u4f38\u533a\u57df\u7684\u6d77\u62d4\u8303\u56f4\u662f\u591a\u5c11\uff1f<\/td>\n<td>1,800\u81f37,000\u82f1\u5c3a<\/td>\n<\/tr>\n<tr>\n<td>\u97f3\u4e50\u5bb6\u548c\u8bbd\u523a\u4f5c\u5bb6Allie Goertz\u4e3a&#8220;\u8f9b\u666e\u68ee\u4e00\u5bb6&#8221;\u4e2d\u7684\u89d2\u8272Milhouse\u5199\u4e86\u4e00\u9996\u6b4c\u3002Matt 
Groening\u662f\u6839\u636e\u8c01\u7684\u540d\u5b57\u6765\u547d\u540d\u8fd9\u4e2a\u89d2\u8272\u7684\uff1f<\/td>\n<td>\u7406\u67e5\u5fb7\u00b7\u5c3c\u514b\u677e<\/td>\n<\/tr>\n<tr>\n<td>\u54ea\u90e8\u7eaa\u5f55\u7247\u662f\u5173\u4e8e\u82ac\u5170\u6447\u6eda\u4e50\u961f\u7684\uff0c\u300a\u4e9a\u5f53\u00b7\u514b\u83b1\u987f\u00b7\u9c8d\u5a01\u5c14\u300b\u8fd8\u662f\u300a\u8428\u4f0a\u9a6c\u884c\u52a8\u300b\uff1f<\/td>\n<td>\u8428\u4f0a\u9a6c\u884c\u52a8<\/td>\n<\/tr>\n<tr>\n<td>\u5c3c\u53e4\u62c9\u65af\u00b7\u96f7\u548c\u827e\u5229\u4e9a\u00b7\u5361\u8d5e\u6709\u4ec0\u4e48\u5171\u540c\u7684\u804c\u4e1a\uff1f<\/td>\n<td>\u5bfc\u6f14\u3001\u7f16\u5267\u3001\u6f14\u5458<\/td>\n<\/tr>\n<tr>\n<td>\u54ea\u672c\u6742\u5fd7\u521b\u529e\u66f4\u65e9\uff0cArthur&#8217;s Magazine\u8fd8\u662fFirst for Women\uff1f<\/td>\n<td>Arthur&#8217;s Magazine<\/td>\n<\/tr>\n<tr>\n<td>\u5e15\u7ef4\u5c14\u00b7\u4e4c\u91cc\u677e\u548c\u5217\u6602\u5c3c\u5fb7\u00b7\u5217\u6587\u662f\u5426\u4ee5\u540c\u4e00\u7c7b\u578b\u7684\u5de5\u4f5c\u800c\u95fb\u540d\uff1f<\/td>\n<td>\u662f<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<table width=\"1208\">\n<tbody>\n<tr>\n<td colspan=\"3\" width=\"1208\">Act<\/td>\n<\/tr>\n<tr>\n<td>Question<\/td>\n<td>Action<\/td>\n<td>Observation<\/td>\n<\/tr>\n<tr>\n<td>What is the elevation range for the area that the eastern sector of the Colorado orogeny extends into?<\/td>\n<td>Search[Colorado orogeny]<\/td>\n<td>The Colorado orogeny was an episode of mountain building (an orogeny) in Colorado and surrounding areas.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Lookup[eastern sector]<\/td>\n<td>(Result 1 \/ 1) The eastern sector extends into the High Plains and is called the Central Plains orogeny.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Search[High Plains]<\/td>\n<td>High Plains refers to one of two distinct land regions:<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Search[High Plains (United States)]<\/td>\n<td>The High Plains are a subregion of the Great Plains. 
From east to west, the High Plains rise in elevation from around 1,800 to 7,000 ft (550 to 2,130 m).[3]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Finish<\/td>\n<td>[1,800 to 7,000 ft]<\/td>\n<\/tr>\n<tr>\n<td>Musician and satirist Allie Goertz wrote a song about the &#8220;The Simpsons&#8221; character Milhouse, who Matt Groening named after who?<\/td>\n<td>Search[Milhouse]<\/td>\n<td>Milhouse Mussolini Van Houten is a recurring character in the Fox animated television series The Simpsons voiced by Pamela Hayden and created by Matt Groening.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Lookup[named after]<\/td>\n<td>(Result 1 \/ 1) Milhouse was named after U.S. president Richard Nixon, whose middle name was Milhous.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Finish<\/td>\n<td>[Richard Nixon]<\/td>\n<\/tr>\n<tr>\n<td>Which documentary is about Finnish rock groups, Adam Clayton Powell or The Saimaa Gesture?<\/td>\n<td>Search[Adam Clayton Powell]<\/td>\n<td>Could not find [Adam Clayton Powell]. Similar: [&#8216;Adam Clayton Powell III&#8217;, &#8216;Seventh Avenue (Manhattan)&#8217;, &#8216;Adam Clayton Powell Jr. State Office Building&#8217;, &#8216;Isabel Washington Powell&#8217;, &#8216;Adam Powell&#8217;, &#8216;Adam Clayton Powell (film)&#8217;, &#8216;Giancarlo Esposito&#8217;].<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Search[Adam Clayton Powell (film)]<\/td>\n<td>Adam Clayton Powell is a 1989 American documentary film directed by Richard Kilberg. 
The film is about the rise and fall of influential African-American politician Adam Clayton Powell Jr.[3][4] It was later aired as part of the PBS series The American Experience.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Finish<\/td>\n<td>[The Saimaa Gesture]<\/td>\n<\/tr>\n<tr>\n<td>What profession does Nicholas Ray and Elia Kazan have in common?<\/td>\n<td>Search[Nicholas Ray]<\/td>\n<td>Nicholas Ray (born Raymond Nicholas Kienzle Jr., August 7, 1911 &#8211; June 16, 1979) was an American film director, screenwriter, and actor best known for the 1955 film Rebel Without a Cause.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Search[Elia Kazan]<\/td>\n<td>Elia Kazan was an American film and theatre director, producer, screenwriter and actor.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u00a0Finish[director, screenwriter, actor]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>Which magazine was started first Arthur\u2019s Magazine or First for Women?<\/td>\n<td>Search[Arthur\u2019s Magazine]<\/td>\n<td>Arthur\u2019s Magazine (1844-1846) was an American literary periodical published in Philadelphia in the 19th century.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Search[First for Women]<\/td>\n<td>First for Women is a woman\u2019s magazine published by Bauer Media Group in the USA.[1] The magazine was started in 1989.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Finish[Arthur\u2019s Magazine]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>Were Pavel Urysohn and Leonid Levin known for the same type of work?<\/td>\n<td>Search[Pavel Urysohn]<\/td>\n<td>Pavel Samuilovich Urysohn (February 3, 1898 &#8211; August 17, 1924) was a Soviet mathematician who is best known for his contributions in dimension theory.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Search[Leonid Levin]<\/td>\n<td>Leonid Anatolievich Levin is a Soviet-American mathematician and <a href=\"https:\/\/www.kdjingpai.com\/en\/tldraw-computer\/\">computer<\/a> 
scientist.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Finish[yes]<\/td>\n<td><\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<table width=\"490\">\n<tbody>\n<tr>\n<td colspan=\"3\" width=\"490\">Act<\/td>\n<\/tr>\n<tr>\n<td>\u95ee\u9898<\/td>\n<td>\u52a8\u4f5c<\/td>\n<td>\u89c2\u5bdf<\/td>\n<\/tr>\n<tr>\n<td>\u79d1\u7f57\u62c9\u591a\u9020\u5c71\u8fd0\u52a8\u4e1c\u6bb5\u5ef6\u4f38\u5230\u7684\u5730\u533a\u7684\u6d77\u62d4\u8303\u56f4\u662f\u591a\u5c11\uff1f<\/td>\n<td>\u641c\u7d22[\u79d1\u7f57\u62c9\u591a\u9020\u5c71\u8fd0\u52a8]<\/td>\n<td>\u79d1\u7f57\u62c9\u591a\u9020\u5c71\u8fd0\u52a8\u662f\u79d1\u7f57\u62c9\u591a\u53ca\u5176\u5468\u8fb9\u5730\u533a\u53d1\u751f\u7684\u4e00\u6b21\u9020\u5c71\u8fd0\u52a8\uff08\u9020\u5c71\u8fd0\u52a8\uff09\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u67e5\u627e[\u4e1c\u6bb5]<\/td>\n<td>(\u7ed3\u679c 1 \/ i) \u4e1c\u6bb5\u5ef6\u4f38\u5230\u9ad8\u5e73\u539f\uff0c\u5e76\u88ab\u79f0\u4e3a\u4e2d\u592e\u5e73\u539f\u9020\u5c71\u8fd0\u52a8\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u641c\u7d22[\u9ad8\u5e73\u539f]<\/td>\n<td>\u9ad8\u5e73\u539f\u6307\u7684\u662f\u4e24\u4e2a\u4e0d\u540c\u7684\u5730\u533a\u4e4b\u4e00\uff1a<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u641c\u7d22[\u9ad8\u5e73\u539f (\u7f8e\u56fd)]<\/td>\n<td>\u9ad8\u5e73\u539f\u662f\u5927\u5e73\u539f\u7684\u4e00\u4e2a\u5b50\u533a\u57df\u3002\u4ece\u4e1c\u5230\u897f\uff0c\u9ad8\u5e73\u539f\u7684\u6d77\u62d4\u4ece\u5927\u7ea61,800\u82f1\u5c3a\uff08550\u7c73\uff09\u4e0a\u5347\u52307,000\u82f1\u5c3a\uff082,130\u7c73\uff09\u3002[3]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u5b8c\u6210<\/td>\n<td>[1,800\u81f37,000\u82f1\u5c3a]<\/td>\n<\/tr>\n<tr>\n<td>\u97f3\u4e50\u5bb6\u548c\u8bbd\u523a\u5bb6Allie Goertz\u5199\u4e86\u4e00\u9996\u5173\u4e8e\u300a\u8f9b\u666e\u68ee\u4e00\u5bb6\u300b\u4e2d\u7684\u89d2\u8272Milhouse\u7684\u6b4c\u66f2\uff0cMatt 
Groening\u662f\u6839\u636e\u8c01\u7684\u540d\u5b57\u6765\u547d\u540d\u8fd9\u4e2a\u89d2\u8272\u7684\uff1f<\/td>\n<td>\u641c\u7d22[Milhouse]<\/td>\n<td>Milhouse Mussolini Van Houten\u662f\u798f\u514b\u65af\u52a8\u753b\u7535\u89c6\u5267\u300a\u8f9b\u666e\u68ee\u4e00\u5bb6\u300b\u4e2d\u7684\u4e00\u4e2a\u5e38\u9a7b\u89d2\u8272\uff0c\u7531Pamela Hayden\u914d\u97f3\uff0c\u5e76\u7531Matt Groening\u521b\u9020\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u67e5\u627e[\u547d\u540d\u6765\u6e90]<\/td>\n<td>(\u7ed3\u679c 1 \/ l) Milhouse\u662f\u6839\u636e\u7f8e\u56fd\u603b\u7edfRichard Nixon\u7684\u540d\u5b57\u547d\u540d\u7684\uff0c\u4ed6\u7684\u4e2d\u95f4\u540d\u662fMilhous\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u5b8c\u6210<\/td>\n<td>[Richard Nixon]<\/td>\n<\/tr>\n<tr>\n<td>\u54ea\u90e8\u7eaa\u5f55\u7247\u662f\u5173\u4e8e\u82ac\u5170\u6447\u6eda\u4e50\u961f\u7684\uff0cAdam Clayton Powell\u8fd8\u662fThe Saimaa Gesture\uff1f<\/td>\n<td>\u641c\u7d22[Adam Clayton Powell]<\/td>\n<td>\u672a\u627e\u5230[Adam Clayton Powell]\u3002\u76f8\u4f3c\u7684\u6709\uff1a[&#8216;Adam Clayton Powel III&#8217;, &#8216;Seventh Avenue (\u66fc\u54c8\u987f)&#8217;, &#8216;Adam clayton Powell Jr. 
\u5dde\u7acb\u529e\u516c\u697c&#8217;, &#8216;Isabel Washington Powell&#8217;, &#8216;Adam Powell&#8217;, &#8216;Adam Clayton Powell (\u7535\u5f71)&#8221;, &#8220;Giancarlo Esposito&#8221;]\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u641c\u7d22[Adam Clayton Powell (\u7535\u5f71)]<\/td>\n<td>Adam Clayton Powell\u662f\u4e00\u90e81989\u5e74\u7531Richard Kilberg\u6267\u5bfc\u7684\u7f8e\u56fd\u7eaa\u5f55\u7247\u7535\u5f71\u3002\u8be5\u7535\u5f71\u8bb2\u8ff0\u4e86\u6709\u5f71\u54cd\u529b\u7684\u975e\u88d4\u7f8e\u56fd\u653f\u6cbb\u5bb6Adam Clayton Powell Jr.\u7684\u5174\u8870\u3002[3][4] \u540e\u6765\u4f5c\u4e3aPBS\u7cfb\u5217\u8282\u76ee\u300a\u7f8e\u56fd\u7ecf\u5386\u300b\u7684\u4e00\u90e8\u5206\u64ad\u51fa\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u5b8c\u6210<\/td>\n<td>[The Saimaa Gesture]<\/td>\n<\/tr>\n<tr>\n<td>Nicholas Ray\u548cElia Kazan\u6709\u4ec0\u4e48\u5171\u540c\u7684\u804c\u4e1a\uff1f<\/td>\n<td>\u641c\u7d22[Nicholas Ray]<\/td>\n<td>Nicholas Ray\uff08\u672c\u540dRaymond Nicholas Kienzle Jr.\uff0c\uff091911\u5e748\u67087\u65e5-1979\u5e746\u670816\u65e5\uff09\u662f\u4e00\u4f4d\u7f8e\u56fd\u7535\u5f71\u5bfc\u6f14\u3001\u7f16\u5267\u548c\u6f14\u5458\uff0c\u4ee51955\u5e74\u7684\u7535\u5f71\u300a\u65e0\u56e0\u7684\u53cd\u53db\u300b\u6700\u4e3a\u4eba\u6240\u77e5\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u641c\u7d22[Elia Kazan]<\/td>\n<td>Elia Kazan\u662f\u4e00\u4f4d\u7f8e\u56fd\u7535\u5f71\u548c\u620f\u5267\u5bfc\u6f14\u3001\u5236\u7247\u4eba\u3001\u7f16\u5267\u548c\u6f14\u5458\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u5b8c\u6210[\u5bfc\u6f14\uff0c\u7f16\u5267\uff0c\u6f14\u5458]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>\u54ea\u672c\u6742\u5fd7\u5148\u521b\u529e\u7684\uff0cArthur\u2019s Magazine\u8fd8\u662fFirst for Women\uff1f<\/td>\n<td>\u641c\u7d22[Arthur\u2019s Magazine]<\/td>\n<td>Arthur\u2019s 
Magazine\uff081844-1846\uff09\u662f19\u4e16\u7eaa\u5728\u7f8e\u56fd\u8d39\u57ce\u51fa\u7248\u7684\u4e00\u672c\u7f8e\u56fd\u6587\u5b66\u671f\u520a\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u641c\u7d22[First for Women]<\/td>\n<td>First for Women\u662fBauer Media Group\u5728\u7f8e\u56fd\u51fa\u7248\u7684\u4e00\u672c\u5973\u6027\u6742\u5fd7\u3002[1] \u8be5\u6742\u5fd7\u59cb\u521b\u4e8e1989\u5e74\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u5b8c\u6210[Arthur\u2019s Magazine]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>Pavel Urysohn\u548cLeonid Levin\u662f\u5426\u56e0\u540c\u4e00\u7c7b\u578b\u7684\u5de5\u4f5c\u800c\u95fb\u540d\uff1f<\/td>\n<td>\u641c\u7d22[Pavel Urysohn]<\/td>\n<td>Pavel Samuilovich Urysohn\uff081898\u5e742\u67083\u65e5-1924\u5e748\u670817\u65e5\uff09\u662f\u4e00\u4f4d\u82cf\u8054\u6570\u5b66\u5bb6\uff0c\u4ee5\u5176\u5728\u7ef4\u6570\u8bba\u65b9\u9762\u7684\u8d21\u732e\u800c\u6700\u4e3a\u4eba\u6240\u77e5\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u641c\u7d22[Leonid Levin]<\/td>\n<td>Leonid Anatolievich Levin\u662f\u4e00\u4f4d\u82cf\u8054-\u7f8e\u56fd\u6570\u5b66\u5bb6\u548c\u8ba1\u7b97\u673a\u79d1\u5b66\u5bb6\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u5b8c\u6210[\u662f]<\/td>\n<td><\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<table width=\"1208\">\n<tbody>\n<tr>\n<td colspan=\"2\" width=\"950\">CoT<\/td>\n<td width=\"258\"><\/td>\n<\/tr>\n<tr style=\"font-weight: var(--table-header-weight);\">\n<td>Question<\/td>\n<td>Thought<\/td>\n<td>Answer<\/td>\n<\/tr>\n<tr>\n<td>What is the elevation range for the area that the eastern sector of the Colorado orogeny extends into?<\/td>\n<td>Let&#8217;s think step by step. The eastern sector of Colorado orogeny extends into the High Plains. 
High Plains rise in elevation from around 1,800 to 7,000 ft, so the answer is 1,800 to 7,000 ft.<\/td>\n<td>1,800 to 7,000 ft<\/td>\n<\/tr>\n<tr>\n<td>Musician and satirist Allie Goertz wrote a song about the &#8220;The Simpsons&#8221; character Milhouse, who Matt Groening named after who?<\/td>\n<td>Let&#8217;s think step by step. Milhouse was named after U.S. president Richard Nixon, so the answer is Richard Nixon.<\/td>\n<td>Richard Nixon<\/td>\n<\/tr>\n<tr>\n<td>Which documentary is about Finnish rock groups, Adam Clayton Powell or The Saimaa Gesture?<\/td>\n<td>Let&#8217;s think step by step. Adam Clayton Powell (film) is a documentary about an African-American politician, not Finnish rock groups. So the documentary about Finnish rock groups must instead be The Saimaa Gesture.<\/td>\n<td>The Saimaa Gesture<\/td>\n<\/tr>\n<tr>\n<td>What profession does Nicholas Ray and Elia Kazan have in common?<\/td>\n<td>Let&#8217;s think step by step. Professions of Nicholas Ray are director, screenwriter, and actor. Professions of Elia Kazan are director, producer, screenwriter, and actor. So profession Nicholas Ray and Elia Kazan have in common is director, screenwriter, and actor.<\/td>\n<td>director, screenwriter, actor<\/td>\n<\/tr>\n<tr>\n<td>Which magazine was started first Arthur&#8217;s Magazine or First for Women?<\/td>\n<td>Let&#8217;s think step by step. Arthur&#8217;s Magazine was started in 1844. First for Women was started in 1989. 1844 (Arthur&#8217;s Magazine) &lt; 1989 (First for Women), so Arthur&#8217;s Magazine was started first.<\/td>\n<td>Arthur&#8217;s Magazine<\/td>\n<\/tr>\n<tr>\n<td>Were Pavel Urysohn and Leonid Levin known for the same type of work?<\/td>\n<td>Let&#8217;s think step by step. Pavel Urysohn is a mathematician. Leonid Levin is a mathematician and computer scientist. 
So Pavel Urysohn and Leonid Levin have the same type of work.<\/td>\n<td>Yes<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<table width=\"757\">\n<tbody>\n<tr>\n<td colspan=\"3\" width=\"757\">CoT<\/td>\n<\/tr>\n<tr>\n<td>\u95ee\u9898<\/td>\n<td>\u601d\u8003\u8fc7\u7a0b<\/td>\n<td>\u7b54\u6848<\/td>\n<\/tr>\n<tr>\n<td>\u79d1\u7f57\u62c9\u591a\u9020\u5c71\u8fd0\u52a8\u4e1c\u6bb5\u5ef6\u4f38\u5230\u7684\u5730\u533a\u7684\u6d77\u62d4\u8303\u56f4\u662f\u591a\u5c11\uff1f<\/td>\n<td>\u8ba9\u6211\u4eec\u4e00\u6b65\u4e00\u6b65\u6765\u8003\u8651\u3002\u79d1\u7f57\u62c9\u591a\u9020\u5c71\u8fd0\u52a8\u7684\u4e1c\u6bb5\u5ef6\u4f38\u5230\u9ad8\u5e73\u539f\u3002\u9ad8\u5e73\u539f\u7684\u6d77\u62d4\u4ece\u5927\u7ea61,800\u82f1\u5c3a\u5347\u9ad8\u52307,000\u82f1\u5c3a\uff0c\u6240\u4ee5\u7b54\u6848\u662f1,800\u52307,000\u82f1\u5c3a\u3002<\/td>\n<td>1,800\u52307,000\u82f1\u5c3a<\/td>\n<\/tr>\n<tr>\n<td>\u97f3\u4e50\u5bb6\u548c\u8bbd\u523a\u5bb6Allie Goertz\u4e3a\u300a\u8f9b\u666e\u68ee\u4e00\u5bb6\u300b\u4e2d\u7684\u89d2\u8272Milhouse\u5199\u4e86\u4e00\u9996\u6b4c\uff0cMatt 
Groening\u662f\u6839\u636e\u8c01\u6765\u547d\u540d\u8fd9\u4e2a\u89d2\u8272\u7684\uff1f<\/td>\n<td>\u8ba9\u6211\u4eec\u4e00\u6b65\u4e00\u6b65\u6765\u8003\u8651\u3002Milhouse\u662f\u6839\u636e\u7f8e\u56fd\u603b\u7edf\u7406\u67e5\u5fb7\u00b7\u5c3c\u514b\u677e\u6765\u547d\u540d\u7684\uff0c\u6240\u4ee5\u7b54\u6848\u662f\u7406\u67e5\u5fb7\u00b7\u5c3c\u514b\u677e\u3002<\/td>\n<td>\u7406\u67e5\u5fb7\u00b7\u5c3c\u514b\u677e<\/td>\n<\/tr>\n<tr>\n<td>\u5173\u4e8e\u82ac\u5170\u6447\u6eda\u4e50\u961f\u7684\u7eaa\u5f55\u7247\u662f\u300a\u4e9a\u5f53\u00b7\u514b\u83b1\u987f\u00b7\u9c8d\u5a01\u5c14\u300b\u8fd8\u662f\u300a\u585e\u9a6c\u96c5\u624b\u52bf\u300b\uff1f<\/td>\n<td>\u8ba9\u6211\u4eec\u4e00\u6b65\u4e00\u6b65\u6765\u8003\u8651\u3002\u300a\u4e9a\u5f53\u00b7\u514b\u83b1\u987f\u00b7\u9c8d\u5a01\u5c14\u300b(\u7535\u5f71)\u662f\u4e00\u90e8\u5173\u4e8e\u975e\u88d4\u7f8e\u56fd\u653f\u6cbb\u5bb6\u7684\u7eaa\u5f55\u7247\uff0c\u4e0d\u662f\u5173\u4e8e\u82ac\u5170\u6447\u6eda\u4e50\u961f\u7684\u3002\u6240\u4ee5\u5173\u4e8e\u82ac\u5170\u6447\u6eda\u4e50\u961f\u7684\u7eaa\u5f55\u7247\u5e94\u8be5\u662f\u300a\u585e\u9a6c\u96c5\u624b\u52bf\u300b\u3002<\/td>\n<td>\u300a\u585e\u9a6c\u96c5\u624b\u52bf\u300b<\/td>\n<\/tr>\n<tr>\n<td>\u5c3c\u53e4\u62c9\u65af\u00b7\u96f7\u548c\u4f0a\u5229\u4e9a\u00b7\u5361\u8d5e\u6709\u4ec0\u4e48\u5171\u540c\u7684\u804c\u4e1a\uff1f<\/td>\n<td>\u8ba9\u6211\u4eec\u4e00\u6b65\u4e00\u6b65\u6765\u8003\u8651\u3002\u5c3c\u53e4\u62c9\u65af\u00b7\u96f7\u7684\u804c\u4e1a\u662f\u5bfc\u6f14\u3001\u7f16\u5267\u548c\u6f14\u5458\u3002\u4f0a\u5229\u4e9a\u00b7\u5361\u8d5e\u7684\u804c\u4e1a\u662f\u5bfc\u6f14\u3001\u5236\u7247\u4eba\u3001\u7f16\u5267\u548c\u6f14\u5458\u3002\u6240\u4ee5\u5c3c\u53e4\u62c9\u65af\u00b7\u96f7\u548c\u4f0a\u5229\u4e9a\u00b7\u5361\u8d5e\u5171\u540c\u7684\u804c\u4e1a\u662f\u5bfc\u6f14\u3001\u7f16\u5267\u548c\u6f14\u5458\u3002<\/td>\n<td>\u5bfc\u6f14\u3001\u7f16\u5267\u3001\u6f14\u5458<\/td>\n<\/tr>\n<tr>\n<td>\u662f\u300a\u963f\u745f\u6742\u5fd7\u300b\u8fd8\u
662f\u300a\u9996\u5148\u4e3a\u5973\u6027\u300b\u5148\u521b\u529e\u7684\uff1f<\/td>\n<td>\u8ba9\u6211\u4eec\u4e00\u6b65\u4e00\u6b65\u6765\u8003\u8651\u3002\u300a\u963f\u745f\u6742\u5fd7\u300b\u521b\u529e\u4e8e1844\u5e74\u3002\u300a\u9996\u5148\u4e3a\u5973\u6027\u300b\u521b\u529e\u4e8e1989\u5e74\u30021844\u5e74(\u300a\u963f\u745f\u6742\u5fd7\u300b) &lt; 1989\u5e74(\u300a\u9996\u5148\u4e3a\u5973\u6027\u300b)\uff0c\u6240\u4ee5\u300a\u963f\u745f\u6742\u5fd7\u300b\u662f\u5148\u521b\u529e\u7684\u3002<\/td>\n<td>\u300a\u963f\u745f\u6742\u5fd7\u300b<\/td>\n<\/tr>\n<tr>\n<td>Pavel Urysohn\u548cLeonid Levin\u662f\u5426\u56e0\u540c\u4e00\u7c7b\u578b\u7684\u5de5\u4f5c\u800c\u95fb\u540d\uff1f<\/td>\n<td>\u8ba9\u6211\u4eec\u4e00\u6b65\u4e00\u6b65\u6765\u8003\u8651\u3002Pavel Urysohn\u662f\u4e00\u4f4d\u6570\u5b66\u5bb6\u3002Leonid Levin\u662f\u4e00\u4f4d\u6570\u5b66\u5bb6\u548c\u8ba1\u7b97\u673a\u79d1\u5b66\u5bb6\u3002\u6240\u4ee5Pavel Urysohn\u548cLeonid Levin\u6709\u76f8\u540c\u7c7b\u578b\u7684\u5de5\u4f5c\u3002<\/td>\n<td>\u662f<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<table width=\"1280\">\n<tbody>\n<tr>\n<td colspan=\"2\" width=\"950\">ReAct<\/td>\n<td width=\"258\"><\/td>\n<td width=\"72\"><\/td>\n<\/tr>\n<tr>\n<td>Question<\/td>\n<td>Thought<\/td>\n<td>Action<\/td>\n<td>Observation<\/td>\n<\/tr>\n<tr>\n<td>What is the elevation range for the area that the eastern sector of the Colorado orogeny extends into?<\/td>\n<td>I need to search Colorado orogeny, find the area that the eastern sector of the Colorado orogeny extends into, then find the elevation range of the area.<\/td>\n<td>Search[Colorado orogeny]<\/td>\n<td>The Colorado orogeny was an episode of mountain building (an orogeny) in Colorado and surrounding areas.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>It does not mention the eastern sector. 
So I need to look up eastern sector.<\/td>\n<td>Lookup[eastern sector]<\/td>\n<td>\u00a0(Result 1 \/ 1) The eastern sector extends into the High Plains and is called the Central Plains orogeny.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>The eastern sector of Colorado orogeny extends into the High Plains. So I need to search High Plains and find its elevation range.<\/td>\n<td>Search[High Plains]<\/td>\n<td>High Plains refers to one of two distinct land regions<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>I need to instead search High Plains (United States).<\/td>\n<td>Search[High Plains (United States)]<\/td>\n<td>The High Plains are a subregion of the Great Plains. From east to west, the High Plains rise in elevation from around 1,800 to 7,000 ft (550 to 2,130 m).[3]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td width=\"425\">\u00a0High Plains rise in elevation from around 1,800 to 7,000 ft, so the answer<br \/>\nis 1,800 to 7,000 ft.<\/td>\n<td>Finish[1,800 to 7,000 ft]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td><\/td>\n<td><\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>Musician and satirist Allie Goertz wrote a song about the &#8220;The Simpsons&#8221; character Milhouse, who Matt Groening named after who?<\/td>\n<td>The question simplifies to &#8220;The Simpsons&#8221; character Milhouse is named after who. I only need to search Milhouse and find who it is named after.<\/td>\n<td>Search[Milhouse]<\/td>\n<td>Milhouse Mussolini Van Houten is a recurring character in the Fox animated television series The Simpsons voiced by Pamela Hayden and created by Matt Groening.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>The paragraph does not tell who Milhouse is named after, maybe I can look up &#8220;named after&#8221;.<\/td>\n<td>Lookup[named after]<\/td>\n<td>(Result 1 \/ 1) Milhouse was named after U.S. president Richard Nixon, whose middle name was Milhous.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Milhouse was named after U.S. 
president Richard Nixon, so the answer is Richard Nixon.<\/td>\n<td>Finish[Richard Nixon]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>Which documentary is about Finnish rock groups, Adam Clayton Powell or The Saimaa Gesture?<\/td>\n<td>I need to search Adam Clayton Powell and The Saimaa Gesture, and find which documentary is about Finnish rock groups.<\/td>\n<td>Search[Adam Clayton Powell]<\/td>\n<td>Could not find [Adam Clayton Powell]. Similar: [\u2019Adam Clayton Powell III\u2019, \u2019Seventh Avenue (Manhattan)\u2019, \u2019Adam Clayton Powell Jr. State Office Building\u2019, \u2019Isabel Washington Powell\u2019, \u2019Adam Powell\u2019, \u2019Adam Clayton Powell (film)\u2019, \u2019Giancarlo Esposito\u2019].<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>To find the documentary, I can search Adam Clayton Powell (film).<\/td>\n<td>Search[Adam Clayton Powell (film)]<\/td>\n<td>Adam Clayton Powell is a 1989 American documentary film directed by Richard Kilberg. The film is about the rise and fall of influential African-American politician Adam Clayton Powell Jr.[3][4] It was later aired as part of the PBS series The American Experience.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Adam Clayton Powell (film) is a documentary about an African-American politician, not Finnish rock groups. So the documentary about Finnish rock groups must instead be The Saimaa Gesture.<\/td>\n<td>Finish[The Saimaa Gesture]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>What profession does Nicholas Ray and Elia Kazan have in common?<\/td>\n<td>I need to search Nicholas Ray and Elia Kazan, find their professions, then find the profession they have in common.<\/td>\n<td>Search[Nicholas Ray]<\/td>\n<td>Nicholas Ray (born Raymond Nicholas Kienzle Jr., August 7, 1911 &#8211; June 16, 1979) was an American film director, screenwriter, and actor best known for the 1955 film Rebel Without a Cause.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Professions of Nicholas Ray are director, screenwriter, and actor. 
I need to search Elia Kazan next and find his professions.<\/td>\n<td>Search[Elia Kazan]<\/td>\n<td>Elia Kazan was an American film and theatre director, producer, screenwriter and actor.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Professions of Elia Kazan are director, producer, screenwriter, and actor. So profession Nicholas Ray and Elia Kazan have in common is director, screenwriter, and actor.<\/td>\n<td>Finish[director, screenwriter, actor]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>Which magazine was started first Arthur\u2019s Magazine or First for Women?<\/td>\n<td>I need to search Arthur\u2019s Magazine and First for Women, and find which was started first.<\/td>\n<td>Search[Arthur\u2019s Magazine]<\/td>\n<td>Arthur\u2019s Magazine (1844-1846) was an American literary periodical published in Philadelphia in the 19th century.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Arthur\u2019s Magazine was started in 1844. I need to search First for Women next.<\/td>\n<td>Search[First for Women]<\/td>\n<td>First for Women is a woman\u2019s magazine published by Bauer Media Group in the USA.[1] The magazine was started in 1989.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>First for Women was started in 1989. 1844 (Arthur\u2019s Magazine) &lt; 1989 (First for Women), so Arthur\u2019s Magazine was started first.<\/td>\n<td>Finish[Arthur\u2019s Magazine]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>Were Pavel Urysohn and Leonid Levin known for the same type of work?<\/td>\n<td>I need to search Pavel Urysohn and Leonid Levin, find their types of work, then find if they are the same.<\/td>\n<td>Search[Pavel Urysohn]<\/td>\n<td>Pavel Samuilovich Urysohn (February 3, 1898 &#8211; August 17, 1924) was a Soviet mathematician who is best known for his contributions in dimension theory.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Pavel Urysohn is a mathematician. 
I need to search Leonid Levin next and find its type of work.<\/td>\n<td>Search[Leonid Levin]<\/td>\n<td>Leonid Anatolievich Levin is a Soviet-American mathematician and computer scientist.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Leonid Levin is a mathematician and computer scientist. So Pavel Urysohn and Leonid Levin have the same type of work.<\/td>\n<td>Finish[yes]<\/td>\n<td><\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<table width=\"757\">\n<tbody>\n<tr>\n<td colspan=\"3\" width=\"757\">\n<p data-tag-name=\"table\">ReAct<\/p>\n<\/td>\n<\/tr>\n<tr>\n<td>\u95ee\u9898<\/td>\n<td>\u601d\u8003<\/td>\n<td>\u884c\u52a8<\/td>\n<\/tr>\n<tr>\n<td>\u79d1\u7f57\u62c9\u591a\u9020\u5c71\u5e26\u4e1c\u6bb5\u5ef6\u4f38\u5230\u7684\u533a\u57df\u7684\u6d77\u62d4\u8303\u56f4\u662f\u591a\u5c11\uff1f<\/td>\n<td>\u6211\u9700\u8981\u641c\u7d22\u79d1\u7f57\u62c9\u591a\u9020\u5c71\u5e26\uff0c\u627e\u5230\u4e1c\u6bb5\u5ef6\u4f38\u5230\u7684\u533a\u57df\uff0c\u7136\u540e\u627e\u5230\u8be5\u533a\u57df\u7684\u6d77\u62d4\u8303\u56f4\u3002<\/td>\n<td>\u641c\u7d22[\u79d1\u7f57\u62c9\u591a\u9020\u5c71\u5e26]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u6ca1\u6709\u63d0\u5230\u4e1c\u6bb5\u3002\u6240\u4ee5\u6211\u9700\u8981\u67e5\u627e\u4e1c\u6bb5\u3002<\/td>\n<td>\u67e5\u627e[\u4e1c\u6bb5]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u79d1\u7f57\u62c9\u591a\u9020\u5c71\u5e26\u7684\u4e1c\u6bb5\u5ef6\u4f38\u5230\u9ad8\u5e73\u539f\u3002\u6240\u4ee5\u6211\u9700\u8981\u641c\u7d22\u9ad8\u5e73\u539f\u5e76\u627e\u5230\u5176\u6d77\u62d4\u8303\u56f4\u3002<\/td>\n<td>\u641c\u7d22[\u9ad8\u5e73\u539f]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u9ad8\u5e73\u539f\u7684\u6d77\u62d4\u4ece\u5927\u7ea61800\u82f1\u5c3a\u4e0a\u5347\u52307000\u82f1\u5c3a\uff0c\u6240\u4ee5\u7b54\u6848\u662f1800\u82f1\u5c3a\u52307000\u82f1\u5c3a\u3002<\/td>\n<td>\u5b8c\u6210[1800\u82f1\u5c3a\u52307000\u82f1\u5c3a]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td><\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>\u97f3\u4e50\u5bb6\u548c\u8bbd\u523a\u4f5c\u5bb6Allie 
Goertz\u4e3a&#8221;The Simpsons&#8221;\u4e2d\u7684\u89d2\u8272Milhouse\u5199\u4e86\u4e00\u9996\u6b4c\uff0cMatt Groening\u662f\u4ee5\u8c01\u7684\u540d\u5b57\u6765\u547d\u540dMilhouse\u7684\uff1f<\/td>\n<td>\u95ee\u9898\u7b80\u5316\u4e3a&#8221;The Simpsons&#8221;\u4e2d\u7684\u89d2\u8272Milhouse\u662f\u4ee5\u8c01\u7684\u540d\u5b57\u547d\u540d\u7684\u3002\u6211\u53ea\u9700\u8981\u641c\u7d22Milhouse\u5e76\u627e\u5230\u5b83\u662f\u4ee5\u8c01\u7684\u540d\u5b57\u547d\u540d\u7684\u3002<\/td>\n<td>\u641c\u7d22[Milhouse]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u6bb5\u843d\u6ca1\u6709\u8bf4\u660eMilhouse\u662f\u4ee5\u8c01\u7684\u540d\u5b57\u547d\u540d\u7684\uff0c\u4e5f\u8bb8\u6211\u53ef\u4ee5\u67e5\u627e&#8221;\u4ee5&#8230;\u547d\u540d&#8221;\u3002<\/td>\n<td>\u67e5\u627e[\u4ee5&#8230;\u547d\u540d]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Milhouse\u662f\u4ee5\u7f8e\u56fd\u603b\u7edfRichard Nixon\u7684\u540d\u5b57\u547d\u540d\u7684\uff0c\u6240\u4ee5\u7b54\u6848\u662fRichard Nixon\u3002<\/td>\n<td>\u5b8c\u6210[Richard Nixon]<\/td>\n<\/tr>\n<tr>\n<td>\u5173\u4e8e\u82ac\u5170\u6447\u6eda\u4e50\u961f\u7684\u7eaa\u5f55\u7247\u662fAdam Clayton Powell\u8fd8\u662fThe Saimaa Gesture\uff1f<\/td>\n<td>\u6211\u9700\u8981\u641c\u7d22Adam Clayton Powell\u548cThe Saimaa Gesture\uff0c\u7136\u540e\u627e\u51fa\u54ea\u90e8\u7eaa\u5f55\u7247\u662f\u5173\u4e8e\u82ac\u5170\u6447\u6eda\u4e50\u961f\u7684\u3002<\/td>\n<td>\u641c\u7d22[Adam Clayton Powell]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u4e3a\u4e86\u627e\u5230\u7eaa\u5f55\u7247\uff0c\u6211\u53ef\u4ee5\u641c\u7d22Adam Clayton Powell (film)\u3002<\/td>\n<td>\u641c\u7d22[Adam Clayton Powell (film)]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Adam Clayton Powell (film)\u662f\u4e00\u90e8\u5173\u4e8e\u975e\u88d4\u7f8e\u56fd\u653f\u6cbb\u5bb6\u7684\u7eaa\u5f55\u7247\uff0c\u800c\u4e0d\u662f\u5173\u4e8e\u82ac\u5170\u6447\u6eda\u4e50\u961f\u7684\u3002\u6240\u4ee5\u5173\u4e8e\u82ac\u5170\u6447\u6eda\u4e50\u961f\u7684\u7eaa\u5f55\u7247\u5fc5\u987b\u662fThe Saimaa 
Gesture\u3002<\/td>\n<td>\u5b8c\u6210[The Saimaa Gesture]<\/td>\n<\/tr>\n<tr>\n<td>Nicholas Ray\u548cElia Kazan\u6709\u4ec0\u4e48\u5171\u540c\u7684\u804c\u4e1a\uff1f<\/td>\n<td>\u6211\u9700\u8981\u641c\u7d22Nicholas Ray\u548cElia Kazan\uff0c\u627e\u5230\u4ed6\u4eec\u7684\u804c\u4e1a\uff0c\u7136\u540e\u627e\u51fa\u4ed6\u4eec\u7684\u5171\u540c\u804c\u4e1a\u3002<\/td>\n<td>\u641c\u7d22[Nicholas Ray]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Nicholas Ray\u7684\u804c\u4e1a\u662f\u5bfc\u6f14\u3001\u7f16\u5267\u548c\u6f14\u5458\u3002\u6211\u63a5\u4e0b\u6765\u9700\u8981\u641c\u7d22Elia Kazan\u5e76\u627e\u5230\u4ed6\u7684\u804c\u4e1a\u3002<\/td>\n<td>\u641c\u7d22[Elia Kazan]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Elia Kazan\u7684\u804c\u4e1a\u662f\u5bfc\u6f14\u3001\u5236\u7247\u4eba\u3001\u7f16\u5267\u548c\u6f14\u5458\u3002\u6240\u4ee5Nicholas Ray\u548cElia Kazan\u7684\u5171\u540c\u804c\u4e1a\u662f\u5bfc\u6f14\u3001\u7f16\u5267\u548c\u6f14\u5458\u3002<\/td>\n<td>\u5b8c\u6210[\u5bfc\u6f14\u3001\u7f16\u5267\u3001\u6f14\u5458]<\/td>\n<\/tr>\n<tr>\n<td>\u54ea\u672c\u6742\u5fd7\u5148\u521b\u529e\u7684\uff0cArthur\u2019s Magazine\u8fd8\u662fFirst for Women\uff1f<\/td>\n<td>\u6211\u9700\u8981\u641c\u7d22Arthur\u2019s Magazine\u548cFirst for Women\uff0c\u7136\u540e\u627e\u51fa\u54ea\u672c\u6742\u5fd7\u5148\u521b\u529e\u7684\u3002<\/td>\n<td>\u641c\u7d22[Arthur\u2019s Magazine]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Arthur\u2019s Magazine\u521b\u529e\u4e8e1844\u5e74\u3002\u6211\u63a5\u4e0b\u6765\u9700\u8981\u641c\u7d22First for Women\u3002<\/td>\n<td>\u641c\u7d22[First for Women]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>First for Women\u521b\u529e\u4e8e1989\u5e74\u30021844\u5e74\uff08Arthur\u2019s Magazine\uff09&lt; 1989\u5e74\uff08First for Women\uff09\uff0c\u6240\u4ee5Arthur\u2019s Magazine\u5148\u521b\u529e\u7684\u3002<\/td>\n<td>\u5b8c\u6210[Arthur\u2019s Magazine]<\/td>\n<\/tr>\n<tr>\n<td>Pavel Urysohn\u548cLeonid 
Levin\u662f\u5426\u4ee5\u540c\u7c7b\u578b\u7684\u5de5\u4f5c\u800c\u95fb\u540d\uff1f<\/td>\n<td>\u6211\u9700\u8981\u641c\u7d22Pavel Urysohn\u548cLeonid Levin\uff0c\u627e\u5230\u4ed6\u4eec\u7684\u5de5\u4f5c\u7c7b\u578b\uff0c\u7136\u540e\u627e\u51fa\u4ed6\u4eec\u662f\u5426\u76f8\u540c\u3002<\/td>\n<td>\u641c\u7d22[Pavel Urysohn]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Pavel Urysohn\u662f\u4e00\u4f4d\u6570\u5b66\u5bb6\u3002\u6211\u63a5\u4e0b\u6765\u9700\u8981\u641c\u7d22Leonid Levin\u5e76\u627e\u5230\u5176\u5de5\u4f5c\u7c7b\u578b\u3002<\/td>\n<td>\u641c\u7d22[Leonid Levin]<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Leonid Levin\u662f\u4e00\u4f4d\u6570\u5b66\u5bb6\u548c\u8ba1\u7b97\u673a\u79d1\u5b66\u5bb6\u3002\u6240\u4ee5Pavel Urysohn\u548cLeonid Levin\u7684\u5de5\u4f5c\u7c7b\u578b\u76f8\u540c\u3002<\/td>\n<td>\u5b8c\u6210[\u662f]<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<h3>C.2 \u4e8b\u5b9e\u63d0\u53d6\u548c\u9a8c\u8bc1\u6570\u636e\u96c6\/FEVER<\/h3>\n<p>FEVER Prompts<\/p>\n<table width=\"810\">\n<tbody>\n<tr>\n<td colspan=\"2\" width=\"810\">Original<\/td>\n<\/tr>\n<tr>\n<td colspan=\"2\">Question\uff1aDetermine if there is Observation that SUPPORTS or REFUTES a Claim, or if there is NOT ENOUGH INFORMATION.<\/td>\n<\/tr>\n<tr>\n<td>Claim<\/td>\n<td>Answer<\/td>\n<\/tr>\n<tr>\n<td>Nikolaj Coster-Waldau worked with the Fox Broadcasting Company.<\/td>\n<td>SUPPORTS<\/td>\n<\/tr>\n<tr>\n<td>Stranger Things is set in Bloomington, Indiana.<\/td>\n<td>REFUTES<\/td>\n<\/tr>\n<tr>\n<td>Beautiful reached number two on the Billboard Hot 100 in 2003.<\/td>\n<td>NOT ENOUGH INFO<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<table width=\"597\">\n<tbody>\n<tr>\n<td colspan=\"2\" width=\"597\">Original<\/td>\n<\/tr>\n<tr>\n<td 
colspan=\"2\">\u95ee\u9898\uff1a\u5224\u65ad\u662f\u5426\u5b58\u5728\u652f\u6301\u6216\u53cd\u9a73\u58f0\u660e\u7684\u89c2\u5bdf\u7ed3\u679c\uff0c\u6216\u8005\u662f\u5426\u4fe1\u606f\u4e0d\u8db3\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u58f0\u660e<\/td>\n<td>\u7b54\u6848<\/td>\n<\/tr>\n<tr>\n<td>\u5c3c\u53e4\u62c9\u00b7\u79d1\u65af\u7279-\u74e6\u5c14\u9053\u66fe\u4e0e\u798f\u514b\u65af\u5e7f\u64ad\u516c\u53f8\u5408\u4f5c\u3002<\/td>\n<td>\u652f\u6301<\/td>\n<\/tr>\n<tr>\n<td>\u300a\u602a\u5947\u7269\u8bed\u300b\u7684\u80cc\u666f\u8bbe\u5b9a\u5728\u5370\u7b2c\u5b89\u7eb3\u5dde\u7684\u5e03\u5362\u660e\u987f\u3002<\/td>\n<td>\u53cd\u9a73<\/td>\n<\/tr>\n<tr>\n<td>\u6b4c\u66f2\u300aBeautiful\u300b\u57282003\u5e74\u8fbe\u5230\u4e86Billboard Hot 100\u7684\u7b2c\u4e8c\u540d\u3002<\/td>\n<td>\u4fe1\u606f\u4e0d\u8db3<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<table width=\"1068\">\n<tbody>\n<tr>\n<td colspan=\"3\" width=\"1068\">Act<\/td>\n<\/tr>\n<tr>\n<td colspan=\"3\">Question\uff1aDetermine if there is Observation that SUPPORTS or REFUTES a Claim, or if there is NOT ENOUGH INFORMATION.<\/td>\n<\/tr>\n<tr>\n<td>Claim<\/td>\n<td>Action<\/td>\n<td>Observation<\/td>\n<\/tr>\n<tr>\n<td>Nikolaj Coster-Waldau worked with the Fox Broadcasting Company.<\/td>\n<td>Search[Nikolaj Coster-Waldau]<\/td>\n<td>Nikolaj William Coster-Waldau (born 27 July 1970) is a Danish actor and producer. He graduated from the Danish National School of Performing Arts in Copenhagen in 1993,[1] and had his breakthrough role in Denmark with the film Nightwatch (1994). He played Jaime Lannister in the HBO fantasy drama series Game of Thrones, for which he received two Primetime Emmy Award nominations for Outstanding Supporting Actor in a Drama Series.. Coster-Waldau has appeared in numerous films in his native Denmark and Scandinavia, including Headhunters (2011) and A Thousand Times Good Night (2013). 
In the U.S, his debut film role was in the war film Black Hawk Down (2001), playing Medal of Honor recipient Gary Gordon.[2] He then played a detective in the short-lived Fox television series New Amsterdam (2008), and appeared in the 2009 Fox television film Virtuality, originally intended as a pilot.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Finish[SUPPORTS]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>Stranger Things is set in Bloomington, Indiana.<\/td>\n<td>Search[Stranger Things]<\/td>\n<td>Stranger Things is an American science fiction horror drama television series created by the Duffer Brothers. Set in the 1980s, primarily in the fictional town of Hawkins, Indiana, the series centers on a number of mysteries and supernatural events occurring around the town and their impact on an ensemble of child and adult characters.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Finish[REFUTES]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>Beautiful reached number two on the Billboard Hot 100 in 2003.<\/td>\n<td>Search[Beautiful]<\/td>\n<td>Could not find [Beautiful]. 
Similar: [\u2019Beautiful\u2019, \u2019Beautiful, Beautiful\u2019, \u2019A Beautiful Mind (film)\u2019, \u2019Beautiful (Christina Aguilera song)\u2019, \u2019Life Is Beautiful\u2019].<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Search[Beautiful (Christina Aguilera song)]<\/td>\n<td>&#8220;Beautiful&#8221; is a song recorded by American singer Christina Aguilera for her fourth studio album, Stripped (2002).<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Lookup[Billboard Hot 100]<\/td>\n<td>(Result 1 \/ 3) The song peaked at number two on the Billboard Hot 100 in the United States, where it was certified Gold for 500,000 units shipped.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Finish[NOT ENOUGH INFO]<\/td>\n<td><\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<table width=\"757\">\n<tbody>\n<tr>\n<td colspan=\"3\" width=\"757\">Act<\/td>\n<\/tr>\n<tr>\n<td colspan=\"3\">\u95ee\u9898\uff1a\u5224\u65ad\u662f\u5426\u6709\u89c2\u5bdf\u7ed3\u679c\u652f\u6301\u6216\u53cd\u9a73\u4e00\u4e2a\u58f0\u660e\uff0c\u6216\u8005\u662f\u5426\u4fe1\u606f\u4e0d\u8db3\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u58f0\u660e<\/td>\n<td>\u884c\u52a8<\/td>\n<td>\u89c2\u5bdf<\/td>\n<\/tr>\n<tr>\n<td>Nikolaj Coster-Waldau \u66fe\u4e0e\u798f\u514b\u65af\u5e7f\u64ad\u516c\u53f8\u5408\u4f5c\u3002<\/td>\n<td>\u641c\u7d22[Nikolaj Coster-Waldau]<\/td>\n<td>Nikolaj William Coster-Waldau\uff08\u51fa\u751f\u4e8e1970\u5e747\u670827\u65e5\uff09\u662f\u4e00\u4f4d\u4e39\u9ea6\u6f14\u5458\u548c\u5236\u7247\u4eba\u3002\u4ed6\u4e8e1993\u5e74\u6bd5\u4e1a\u4e8e\u54e5\u672c\u54c8\u6839\u7684\u4e39\u9ea6\u56fd\u5bb6\u8868\u6f14\u827a\u672f\u5b66\u9662\uff0c[1] \u5e76\u5728\u4e39\u9ea6\u901a\u8fc7\u7535\u5f71\u300a\u591c\u5de1\u300b\uff081994\u5e74\uff09\u83b7\u5f97\u4e86\u7a81\u7834\u6027\u89d2\u8272\u3002\u4ed6\u5728HBO\u5e7b\u60f3\u5267\u96c6\u300a\u6743\u529b\u7684\u6e38\u620f\u300b\u4e2d\u626e\u6f14Jaime 
Lannister\uff0c\u56e0\u6b64\u83b7\u5f97\u4e86\u4e24\u6b21\u9ec4\u91d1\u65f6\u6bb5\u827e\u7f8e\u5956\u5267\u60c5\u7c7b\u6700\u4f73\u7537\u914d\u89d2\u63d0\u540d\u3002Coster-Waldau\u5728\u4ed6\u7684\u7956\u56fd\u4e39\u9ea6\u548c\u65af\u582a\u7684\u7eb3\u7ef4\u4e9a\u51fa\u6f14\u4e86\u4f17\u591a\u7535\u5f71\uff0c\u5305\u62ec\u300a\u730e\u5934\u300b\uff082011\u5e74\uff09\u548c\u300a\u5343\u6b21\u665a\u5b89\u300b\uff082013\u5e74\uff09\u3002\u5728\u7f8e\u56fd\uff0c\u4ed6\u7684\u9996\u90e8\u7535\u5f71\u89d2\u8272\u662f\u5728\u6218\u4e89\u7247\u300a\u9ed1\u9e70\u5760\u843d\u300b\uff082001\u5e74\uff09\u4e2d\u626e\u6f14\u8363\u8a89\u52cb\u7ae0\u83b7\u5f97\u8005Gary Gordon\u3002[2] \u4ed6\u8fd8\u66fe\u5728\u77ed\u547d\u7684\u798f\u514b\u65af\u7535\u89c6\u7cfb\u5217\u5267\u300a\u65b0\u963f\u59c6\u65af\u7279\u4e39\u300b\uff082008\u5e74\uff09\u4e2d\u626e\u6f14\u4fa6\u63a2\uff0c\u5e76\u51fa\u73b0\u57282009\u5e74\u798f\u514b\u65af\u7535\u89c6\u7535\u5f71\u300a\u865a\u62df\u4e16\u754c\u300b\u4e2d\uff0c\u8be5\u7535\u5f71\u539f\u672c\u662f\u4f5c\u4e3a\u4e00\u90e8\u8bd5\u64ad\u96c6\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u5b8c\u6210[\u652f\u6301]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>\u300a\u602a\u5947\u7269\u8bed\u300b\u7684\u80cc\u666f\u8bbe\u5b9a\u5728\u5370\u7b2c\u5b89\u7eb3\u5dde\u7684\u5e03\u5362\u660e\u987f\u3002<\/td>\n<td>\u641c\u7d22[Stranger 
Things]<\/td>\n<td>\u300a\u602a\u5947\u7269\u8bed\u300b\u662f\u7531\u8fbe\u592b\u5144\u5f1f\u521b\u4f5c\u7684\u7f8e\u56fd\u79d1\u5e7b\u6050\u6016\u5267\u96c6\u3002\u5267\u96c6\u8bbe\u5b9a\u57281980\u5e74\u4ee3\uff0c\u4e3b\u8981\u53d1\u751f\u5728\u865a\u6784\u7684\u5370\u7b2c\u5b89\u7eb3\u5dde\u970d\u91d1\u65af\u5c0f\u9547\uff0c\u56f4\u7ed5\u5c0f\u9547\u53d1\u751f\u7684\u4e00\u7cfb\u5217\u795e\u79d8\u548c\u8d85\u81ea\u7136\u4e8b\u4ef6\u53ca\u5176\u5bf9\u4e00\u7fa4\u513f\u7ae5\u548c\u6210\u4eba\u89d2\u8272\u7684\u5f71\u54cd\u5c55\u5f00\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u5b8c\u6210[\u53cd\u9a73]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>\u300aBeautiful\u300b\u57282003\u5e74\u8fbe\u5230\u4e86Billboard Hot 100\u7684\u7b2c\u4e8c\u540d\u3002<\/td>\n<td>\u641c\u7d22[Beautiful]<\/td>\n<td>\u672a\u627e\u5230[Beautiful]\u3002\u76f8\u4f3c\u7684\u6709\uff1a[\u2019Beautiful\u2019, \u2019Beautiful, Beautiful\u2019, \u2019A Beautiful Mind (film)\u2019, \u2019Beautiful (Christina Aguilera song)\u2019, \u2019Life Is Beautiful\u2019]\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u641c\u7d22[Beautiful (Christina Aguilera song)]<\/td>\n<td>&#8220;Beautiful&#8221;\u662f\u7f8e\u56fd\u6b4c\u624b\u514b\u91cc\u65af\u8482\u5a1c\u00b7\u963f\u594e\u83b1\u62c9\u4e3a\u5979\u4e8e2002\u5e74\u53d1\u884c\u7684\u7b2c\u56db\u5f20\u5f55\u97f3\u5ba4\u4e13\u8f91\u300aStripped\u300b\u5f55\u5236\u7684\u4e00\u9996\u6b4c\u66f2\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u67e5\u627e[Billboard Hot 100]<\/td>\n<td>\uff08\u7ed3\u679c1 \/ 3\uff09\u8fd9\u9996\u6b4c\u66f2\u5728\u7f8e\u56fdBillboard Hot 100\u4e0a\u8fbe\u5230\u4e86\u7b2c\u4e8c\u540d\uff0c\u5e76\u83b7\u5f97\u4e86500,000\u5355\u4f4d\u7684\u51fa\u8d27\u91cf\u8ba4\u8bc1\u4e3a\u91d1\u5531\u7247\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u5b8c\u6210[\u4fe1\u606f\u4e0d\u8db3]<\/td>\n<td><\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<table width=\"1068\">\n<tbody>\n<tr>\n<td colspan=\"3\" width=\"1068\">CoT<\/td>\n<\/tr>\n<tr>\n<td 
colspan=\"3\">Question\uff1aDetermine if there is Observation that SUPPORTS or REFUTES a Claim, or if there is NOT ENOUGH INFORMATION.<\/td>\n<\/tr>\n<tr>\n<td>Claim<\/td>\n<td>Thought<\/td>\n<td>Answer<\/td>\n<\/tr>\n<tr>\n<td>Nikolaj Coster-Waldau worked with the Fox Broadcasting Company.<\/td>\n<td>Nikolaj William Coster-Waldau appeared in the 2009 Fox television film Virtuality, so he has worked with the Fox Broadcasting Company.<\/td>\n<td>SUPPORTS<\/td>\n<\/tr>\n<tr>\n<td>Stranger Things is set in Bloomington, Indiana.<\/td>\n<td>Stranger Things is in the fictional town of Hawkins, Indiana, not in Bloomington, Indiana.<\/td>\n<td>REFUTES<\/td>\n<\/tr>\n<tr>\n<td>Beautiful reached number two on the Billboard Hot 100 in 2003.<\/td>\n<td>The song peaked at number two on the Billboard Hot 100 in the United States, but not sure if it was in 2003.<\/td>\n<td>NOT ENOUGH INFO<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<table width=\"757\">\n<tbody>\n<tr>\n<td colspan=\"3\" width=\"757\">CoT<\/td>\n<\/tr>\n<tr>\n<td 
colspan=\"3\">\u95ee\u9898\uff1a\u5224\u65ad\u662f\u5426\u5b58\u5728\u652f\u6301\u6216\u53cd\u9a73\u67d0\u4e2a\u4e3b\u5f20\u7684\u89c2\u5bdf\u7ed3\u679c\uff0c\u6216\u8005\u662f\u5426\u4fe1\u606f\u4e0d\u8db3\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u4e3b\u5f20<\/td>\n<td>\u601d\u8003<\/td>\n<td>\u7b54\u6848<\/td>\n<\/tr>\n<tr>\n<td>\u5c3c\u53e4\u62c9\u00b7\u79d1\u65af\u7279-\u74e6\u5c14\u9053\u66fe\u4e0e\u798f\u514b\u65af\u5e7f\u64ad\u516c\u53f8\u5408\u4f5c\u3002<\/td>\n<td>\u5c3c\u53e4\u62c9\u00b7\u5a01\u5ec9\u00b7\u79d1\u65af\u7279-\u74e6\u5c14\u9053\u51fa\u6f14\u4e862009\u5e74\u798f\u514b\u65af\u7535\u89c6\u7535\u5f71\u300a\u865a\u62df\u4e16\u754c\u300b\uff0c\u56e0\u6b64\u4ed6\u66fe\u4e0e\u798f\u514b\u65af\u5e7f\u64ad\u516c\u53f8\u5408\u4f5c\u3002<\/td>\n<td>\u652f\u6301<\/td>\n<\/tr>\n<tr>\n<td>\u300a\u602a\u5947\u7269\u8bed\u300b\u7684\u6545\u4e8b\u53d1\u751f\u5728\u5370\u7b2c\u5b89\u7eb3\u5dde\u7684\u5e03\u5362\u660e\u987f\u3002<\/td>\n<td>\u300a\u602a\u5947\u7269\u8bed\u300b\u7684\u6545\u4e8b\u53d1\u751f\u5728\u865a\u6784\u7684\u5370\u7b2c\u5b89\u7eb3\u5dde\u970d\u91d1\u65af\u9547\uff0c\u800c\u4e0d\u662f\u5370\u7b2c\u5b89\u7eb3\u5dde\u7684\u5e03\u5362\u660e\u987f\u3002<\/td>\n<td>\u53cd\u9a73<\/td>\n<\/tr>\n<tr>\n<td>\u6b4c\u66f2\u300a\u7f8e\u4e3d\u300b\u57282003\u5e74\u8fbe\u5230\u4e86\u7f8e\u56fd\u516c\u544a\u724c\u70ed\u95e8100\u5f3a\u7684\u7b2c\u4e8c\u540d\u3002<\/td>\n<td>\u8be5\u6b4c\u66f2\u5728\u7f8e\u56fd\u516c\u544a\u724c\u70ed\u95e8100\u5f3a\u4e2d\u8fbe\u5230\u4e86\u7b2c\u4e8c\u540d\uff0c\u4f46\u4e0d\u786e\u5b9a\u662f\u5426\u662f\u57282003\u5e74\u3002<\/td>\n<td>\u4fe1\u606f\u4e0d\u8db3<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<table width=\"1140\">\n<tbody>\n<tr>\n<td colspan=\"4\" width=\"1140\">ReAct<\/td>\n<\/tr>\n<tr>\n<td colspan=\"4\">Question\uff1aDetermine if there is Observation that SUPPORTS or REFUTES a Claim, or if there is NOT ENOUGH 
INFORMATION.<\/td>\n<\/tr>\n<tr>\n<td>Claim<\/td>\n<td>Thought<\/td>\n<td>Action<\/td>\n<td>Observation<\/td>\n<\/tr>\n<tr>\n<td>Nikolaj Coster-Waldau worked with the Fox Broadcasting Company.<\/td>\n<td>I need to search Nikolaj Coster-Waldau and find if he has worked with the Fox Broadcasting Company.<\/td>\n<td>Search[Nikolaj Coster-Waldau]<\/td>\n<td>Nikolaj William Coster-Waldau (born 27 July 1970) is a Danish actor and producer. He graduated from the Danish National School of Performing Arts in Copenhagen in 1993,[1] and had his breakthrough role in Denmark with the film Nightwatch (1994). He played Jaime Lannister in the HBO fantasy drama series Game of Thrones, for which he received two Primetime Emmy Award nominations for Outstanding Supporting Actor in a Drama Series.. Coster-Waldau has appeared in numerous films in his native Denmark and Scandinavia, including Headhunters (2011) and A Thousand Times Good Night (2013). In the U.S, his debut film role was in the war film Black Hawk Down (2001), playing Medal of Honor recipient Gary Gordon.[2] He then played a detective in the short-lived Fox television series New Amsterdam (2008), and appeared in the 2009 Fox television film Virtuality, originally intended as a pilot.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>Because he &#8220;appeared in the 2009 Fox television film Virtuality&#8221;, he should have worked with the Fox Broadcasting Company.<\/td>\n<td>Finish[SUPPORTS]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>Stranger Things is set in Bloomington, Indiana.<\/td>\n<td>I should search for Stranger Things, and see if it is set in Bloomington, Indiana.<\/td>\n<td>Search[Stranger Things]<\/td>\n<td>Stranger Things is an American science fiction horror drama television series created by the Duffer Brothers. 
Set in the 1980s, primarily in the fictional town of Hawkins, Indiana, the series centers on a number of mysteries and supernatural events occurring around the town and their impact on an ensemble of child and adult characters.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>The observation says that it is set in a &#8220;fictional town of Hawkins, Indiana&#8221;, so it is not set in Bloomington.<\/td>\n<td>Finish[REFUTES]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>Beautiful reached number two on the Billboard Hot 100 in 2003.<\/td>\n<td>I need to search the song Beautiful and find if it reached number two on the Billboard Hot 100 in 2003.<\/td>\n<td>Search[Beautiful]<\/td>\n<td>Could not find [Beautiful]. Similar: [\u2019Beautiful\u2019, \u2019Beautiful, Beautiful\u2019, \u2019A Beautiful Mind (film)\u2019, \u2019Beautiful (Christina Aguilera song)\u2019, \u2019Life Is Beautiful\u2019].<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>From suggestions, I should search &#8220;Beautiful (Christina Aguilera song)&#8221; to find the song.<\/td>\n<td>Search[Beautiful (Christina Aguilera song)]<\/td>\n<td>&#8220;Beautiful&#8221; is a song recorded by American singer Christina Aguilera for her fourth studio album, Stripped (2002).<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>It does not mention Billboard, so I need to look up &#8220;Billboard Hot 100&#8221; to find if it reached number two on it in 2003.<\/td>\n<td>Lookup[Billboard Hot 100]<\/td>\n<td>(Result 1 \/ 3) The song peaked at number two on the Billboard Hot 100 in the United States, where it was certified Gold for 500,000 units shipped.<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>It only says the song peaked at number two on the Billboard Hot 100, but not if it was in 2003. 
I am not sure if this claim is true or not.<\/td>\n<td>Finish[NOT ENOUGH INFO]<\/td>\n<td><\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<table width=\"829\">\n<tbody>\n<tr>\n<td colspan=\"4\" width=\"829\">\n<p data-tag-name=\"table\">ReAct<\/p>\n<\/td>\n<\/tr>\n<tr>\n<td colspan=\"4\">\u95ee\u9898\uff1a\u786e\u5b9a\u662f\u5426\u6709\u89c2\u5bdf\u7ed3\u679c\u652f\u6301\u6216\u53cd\u9a73\u4e00\u4e2a\u58f0\u660e\uff0c\u6216\u8005\u662f\u5426\u4fe1\u606f\u4e0d\u8db3\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u58f0\u660e<\/td>\n<td>\u601d\u8003<\/td>\n<td>\u884c\u52a8<\/td>\n<td>\u89c2\u5bdf<\/td>\n<\/tr>\n<tr>\n<td>\u5c3c\u53e4\u62c9\u00b7\u79d1\u65af\u7279-\u74e6\u5c14\u9053\u66fe\u4e0e\u798f\u514b\u65af\u5e7f\u64ad\u516c\u53f8\u5408\u4f5c\u3002<\/td>\n<td>\u6211\u9700\u8981\u641c\u7d22\u5c3c\u53e4\u62c9\u00b7\u79d1\u65af\u7279-\u74e6\u5c14\u9053\uff0c\u67e5\u627e\u4ed6\u662f\u5426\u4e0e\u798f\u514b\u65af\u5e7f\u64ad\u516c\u53f8\u5408\u4f5c\u8fc7\u3002<\/td>\n<td>\u641c\u7d22[\u5c3c\u53e4\u62c9\u00b7\u79d1\u65af\u7279-\u74e6\u5c14\u9053]<\/td>\n<td>\u5c3c\u53e4\u62c9\u00b7\u5a01\u5ec9\u00b7\u79d1\u65af\u7279-\u74e6\u5c14\u9053\uff08\u51fa\u751f\u4e8e1970\u5e747\u670827\u65e5\uff09\u662f\u4e00\u4f4d\u4e39\u9ea6\u6f14\u5458\u548c\u5236\u7247\u4eba\u3002\u4ed6\u4e8e1993\u5e74\u6bd5\u4e1a\u4e8e\u54e5\u672c\u54c8\u6839\u7684\u4e39\u9ea6\u56fd\u5bb6\u8868\u6f14\u827a\u672f\u5b66\u9662\uff0c[1]\uff0c\u5e76\u51ed\u501f1994\u5e74\u7684\u7535\u5f71\u300a\u591c\u73ed\u300b\u5728\u4e39\u9ea6\u53d6\u5f97\u4e86\u7a81\u7834\u6027\u7684\u89d2\u8272\u3002\u4ed6\u5728HBO\u5e7b\u60f3\u5267\u96c6\u300a\u6743\u529b\u7684\u6e38\u620f\u300b\u4e2d\u626e\u6f14\u8a79\u59c6\u00b7\u5170\u5c3c\u65af\u7279\uff0c\u56e0\u6b64\u83b7\u5f97\u4e86\u4e24\u6b21\u9ec4\u91d1\u65f6\u6bb5\u827e\u7f8e\u5956\u6700\u4f73\u5267\u60c5\u7c7b\u7537\u914d\u89d2\u63d0\u540d\u3002\u3002\u79d1\u65af\u7279-\u74e6\u5c14\u9053\u5728\u4ed6\u7684\u7956\u56fd\u4e39\u9ea6\u548c\u65af\u582a\u7684\u7eb3\u7ef4\u4e9a\u51fa\u6f14\u4e8
6\u4f17\u591a\u7535\u5f71\uff0c\u5305\u62ec\u300a\u730e\u5934\u4eba\u300b\uff082011\u5e74\uff09\u548c\u300a\u5343\u6b21\u665a\u5b89\u300b\uff082013\u5e74\uff09\u3002\u5728\u7f8e\u56fd\uff0c\u4ed6\u7684\u9996\u90e8\u7535\u5f71\u89d2\u8272\u662f\u5728\u6218\u4e89\u7247\u300a\u9ed1\u9e70\u5760\u843d\u300b\uff082001\u5e74\uff09\u4e2d\u626e\u6f14\u8363\u8a89\u52cb\u7ae0\u83b7\u5f97\u8005\u52a0\u91cc\u00b7\u6208\u767b\u3002[2] \u4ed6\u5728\u798f\u514b\u65af\u7535\u89c6\u77ed\u5267\u300a\u65b0\u963f\u59c6\u65af\u7279\u4e39\u300b\uff082008\u5e74\uff09\u4e2d\u626e\u6f14\u4e86\u4e00\u540d\u4fa6\u63a2\uff0c\u5e76\u51fa\u73b0\u57282009\u5e74\u798f\u514b\u65af\u7535\u89c6\u7535\u5f71\u300a\u865a\u62df\u4e16\u754c\u300b\u4e2d\uff0c\u8be5\u7535\u5f71\u539f\u672c\u662f\u4f5c\u4e3a\u4e00\u90e8\u8bd5\u64ad\u96c6\u5236\u4f5c\u7684\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u56e0\u4e3a\u4ed6\u5728\u201c2009\u5e74\u798f\u514b\u65af\u7535\u89c6\u7535\u5f71\u300a\u865a\u62df\u4e16\u754c\u300b\u201d\u4e2d\u51fa\u6f14\u8fc7\uff0c\u6240\u4ee5\u4ed6\u5e94\u8be5\u4e0e\u798f\u514b\u65af\u5e7f\u64ad\u516c\u53f8\u5408\u4f5c\u8fc7\u3002<\/td>\n<td>\u5b8c\u6210[\u652f\u6301]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>\u300a\u602a\u5947\u7269\u8bed\u300b\u7684\u6545\u4e8b\u53d1\u751f\u5728\u5370\u7b2c\u5b89\u7eb3\u5dde\u7684\u5e03\u5362\u660e\u987f\u3002<\/td>\n<td>\u6211\u5e94\u8be5\u641c\u7d22\u300a\u602a\u5947\u7269\u8bed\u300b\uff0c\u770b\u770b\u5b83\u662f\u5426\u53d1\u751f\u5728\u5370\u7b2c\u5b89\u7eb3\u5dde\u7684\u5e03\u5362\u660e\u987f\u3002<\/td>\n<td>\u641c\u7d22[\u300a\u602a\u5947\u7269\u8bed\u300b]<\/td>\n<td>\u300a\u602a\u5947\u7269\u8bed\u300b\u662f\u7531\u8fbe\u592b\u5144\u5f1f\u521b\u4f5c\u7684\u7f8e\u56fd\u79d1\u5e7b\u6050\u6016\u5267\u96c6\u3002\u8bbe\u5b9a\u57281980\u5e74\u4ee3\uff0c\u4e3b\u8981\u5728\u865a\u6784\u7684\u5370\u7b2c\u5b89\u7eb3\u5dde\u970d\u91d1\u65af\u5c0f\u9547\uff0c\u8be5\u5267\u56f4\u7ed5\u8be5\u9547\u53d1\u751f\u7684\u4e00\u7cfb\u5217\u795e\u79d8\u548c\u8d85\u81ea\u7
136\u4e8b\u4ef6\u53ca\u5176\u5bf9\u4e00\u7fa4\u513f\u7ae5\u548c\u6210\u4eba\u89d2\u8272\u7684\u5f71\u54cd\u5c55\u5f00\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u89c2\u5bdf\u8868\u660e\u5b83\u662f\u8bbe\u5b9a\u5728\u201c\u865a\u6784\u7684\u970d\u91d1\u65af\u5c0f\u9547\uff0c\u5370\u7b2c\u5b89\u7eb3\u5dde\u201d\uff0c\u6240\u4ee5\u5b83\u5e76\u4e0d\u662f\u53d1\u751f\u5728\u5e03\u5362\u660e\u987f\u3002<\/td>\n<td>\u5b8c\u6210[\u53cd\u9a73]<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>\u300a\u7f8e\u4e3d\u300b\u57282003\u5e74\u8fbe\u5230\u4e86Billboard Hot 100\u7684\u7b2c\u4e8c\u540d\u3002<\/td>\n<td>\u6211\u9700\u8981\u641c\u7d22\u6b4c\u66f2\u300a\u7f8e\u4e3d\u300b\u5e76\u67e5\u627e\u5b83\u662f\u5426\u57282003\u5e74\u8fbe\u5230\u4e86Billboard Hot 100\u7684\u7b2c\u4e8c\u540d\u3002<\/td>\n<td>\u641c\u7d22[\u300a\u7f8e\u4e3d\u300b]<\/td>\n<td>\u672a\u627e\u5230[\u300a\u7f8e\u4e3d\u300b]\u3002\u76f8\u4f3c\u7684\u6709\uff1a[\u2019Beautiful\u2019, \u2019Beautiful, Beautiful\u2019, \u2019A Beautiful Mind (film)\u2019, \u2019Beautiful (Christina Aguilera song)\u2019, \u2019Life Is Beautiful\u2019]\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u4ece\u5efa\u8bae\u4e2d\uff0c\u6211\u5e94\u8be5\u641c\u7d22\u201c\u514b\u91cc\u65af\u8482\u5a1c\u00b7\u963f\u594e\u83b1\u62c9\u7684\u6b4c\u66f2\u300a\u7f8e\u4e3d\u300b\u201d\u6765\u627e\u5230\u8fd9\u9996\u6b4c\u3002<\/td>\n<td>\u641c\u7d22[\u514b\u91cc\u65af\u8482\u5a1c\u00b7\u963f\u594e\u83b1\u62c9\u7684\u6b4c\u66f2\u300a\u7f8e\u4e3d\u300b]<\/td>\n<td>\u201c\u7f8e\u4e3d\u201d\u662f\u7f8e\u56fd\u6b4c\u624b\u514b\u91cc\u65af\u8482\u5a1c\u00b7\u963f\u594e\u83b1\u62c9\u4e3a\u5979\u4e8e2002\u5e74\u53d1\u884c\u7684\u7b2c\u56db\u5f20\u5f55\u97f3\u5ba4\u4e13\u8f91\u300aStripped\u300b\u5f55\u5236\u7684\u4e00\u9996\u6b4c\u66f2\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u5b83\u5e76\u6ca1\u6709\u63d0\u5230Billboard\uff0c\u6240\u4ee5\u6211\u9700\u8981\u67e5\u627e\u201cBillboard Hot 
100\u201d\u6765\u786e\u8ba4\u5b83\u662f\u5426\u57282003\u5e74\u8fbe\u5230\u4e86\u7b2c\u4e8c\u540d\u3002<\/td>\n<td>\u67e5\u627e[Billboard Hot 100]<\/td>\n<td>\uff08\u7ed3\u679c1 \/ 3\uff09\u8fd9\u9996\u6b4c\u66f2\u5728\u7f8e\u56fdBillboard Hot 100\u699c\u5355\u4e0a\u8fbe\u5230\u4e86\u7b2c\u4e8c\u540d\u7684\u9ad8\u5cf0\uff0c\u5e76\u4e14\u5728\u90a3\u91cc\u83b7\u5f97\u4e86500,000\u5355\u4f4d\u7684\u91d1\u5531\u7247\u8ba4\u8bc1\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td>\u5b83\u53ea\u63d0\u5230\u8fd9\u9996\u6b4c\u66f2\u5728Billboard Hot 100\u4e0a\u8fbe\u5230\u4e86\u7b2c\u4e8c\u540d\uff0c\u4f46\u6ca1\u6709\u63d0\u5230\u662f\u5426\u662f\u57282003\u5e74\u3002\u6211\u4e0d\u786e\u5b9a\u8fd9\u4e2a\u58f0\u660e\u662f\u771f\u662f\u5047\u3002<\/td>\n<td>\u5b8c\u6210[\u4fe1\u606f\u4e0d\u8db3]<\/td>\n<td><\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>&nbsp;<\/p>\n<h3>C.3 \u7f51\u7edc\u8d2d\u7269<\/h3>\n<p><img loading=\"lazy\" decoding=\"async\" class=\"aligncenter size-full wp-image-2535\" title=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-11\" src=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/55506240b421bf0.png\" alt=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-11\" width=\"651\" height=\"771\" srcset=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/55506240b421bf0.png 651w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/55506240b421bf0-253x300.png 253w\" sizes=\"auto, (max-width: 651px) 100vw, 651px\" \/><\/p>\n<p>\u8868\u683c 6: \u7b2c 4 \u7ae0\u8282\u4e2d\u7528\u4e8e\u7f51\u7edc\u5546\u5e97\u5b9e\u9a8c\u7684\u63d0\u793a\u8bed\u3002\u6211\u4eec\u4f7f\u7528\u5de6\u4fa7\u7684\u63d0\u793a\u8bed\u8fdb\u884c\u884c\u52a8(Act)\uff0c\u5e76\u4f7f\u7528\u53f3\u4fa7\u7684\u63d0\u793a\u8bed\uff08\u6dfb\u52a0\u63a8\u7406\uff09\u8fdb\u884c\u53cd\u5e94(ReAct)\u3002<\/p>\n<div class=\"markdown-preview-pusher\"><\/div>\n<div class=\"el-table\" 
data-tag-name=\"table\">\n<table>\n<thead>\n<tr>\n<th><strong>\u6307\u4ee4\uff1a<\/strong>\u6211\u60f3\u8981\u4e00\u74f63\u76ce\u53f8\u7684\u4eae\u67d1\u6a58\u9999\u578b\u654f\u611f\u808c\u80a4\u7528\u9664\u81ed\u5242\uff0c\u4ef7\u683c\u4f4e\u4e8e50.00\u7f8e\u5143<\/th>\n<th><\/th>\n<th><\/th>\n<th><\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>Act<\/td>\n<td><\/td>\n<td>ReAct<\/td>\n<td><\/td>\n<\/tr>\n<tr>\n<td>\u52a8\u4f5c<\/td>\n<td>\u89c2\u5bdf<\/td>\n<td>\u52a8\u4f5c<\/td>\n<td>\u89c2\u5bdf<\/td>\n<\/tr>\n<tr>\n<td>\u641c\u7d22[3\u76ce\u53f8\u4eae\u67d1\u6a58\u9999\u578b\u654f\u611f\u808c\u80a4\u7528\u9664\u81ed\u5242]<\/td>\n<td>[\u8fd4\u56de\u641c\u7d22]<br \/>\n\u7b2c1\u9875 (\u603b\u7ed3\u679c\u6570\uff1a50)[\u4e0b\u4e00\u9875][B078GWRC1J]<br \/>\nEarth Mama\u7684\u4eae\u67d1\u6a58\u9664\u81ed\u5242 | \u5929\u7136\u4e14\u9002\u7528\u4e8e<br \/>\n\u654f\u611f\u808c\u80a4\u3001\u5b55\u671f\u548c\u54fa\u4e73\u671f\uff0c\u542b\u6709\u6709\u673a<br \/>\n\u91d1\u76cf\u82b1 3\u76ce\u53f8<br \/>\n$10.99[B078GTKVXY]<br \/>\nEarth Mama\u7684\u59dc\u5473\u6e05\u65b0\u9664\u81ed\u5242 | \u5929\u7136\u4e14\u9002\u7528\u4e8e<br \/>\n\u654f\u611f\u808c\u80a4\u3001\u5b55\u671f\u548c\u54fa\u4e73\u671f\uff0c\u542b\u6709\u6709\u673a<br \/>\n\u91d1\u76cf\u82b1 3\u76ce\u53f8<br \/>\n$10.99[B08KBVJ4XN]<br \/>\nBarrel and Oak &#8211; \u65e0\u94dd\u9664\u81ed\u5242\uff0c\u7537\u58eb\u7528<br \/>\n\u57fa\u4e8e\u7cbe\u6cb9\u7684\u9999\u5473\uff0c24\u5c0f\u65f6\u9632\u81ed\uff0c\u96ea\u677e<br \/>\n&amp; \u5e7f\u85ff\u9999\u6df7\u5408\uff0c\u6e29\u548c\u9002\u5408\u654f\u611f\u808c\u80a4\uff08\u5c71 sage\uff0c<br \/>\n2.7\u76ce\u53f8\uff0c2\u74f6\u88c5\uff09<br \/>\n$15.95<\/td>\n<td>\u641c\u7d22 3\u76ce\u53f8\u4eae\u67d1\u6a58\u9999\u578b\u654f\u611f\u808c\u80a4\u7528\u9664\u81ed\u5242<\/td>\n<td>[\u8fd4\u56de\u641c\u7d22]<br \/>\n\u7b2c1\u9875 (\u603b\u7ed3\u679c\u6570\uff1a50)[\u4e0b\u4e00\u9875][B078GWRC1J]<br \/>\nEarth Mama\u7684\u4eae\u67d1\u6a58\u9664\u81ed\u5242 | 
\u5929\u7136\u4e14\u9002\u7528\u4e8e<br \/>\n\u654f\u611f\u808c\u80a4\u3001\u5b55\u671f\u548c\u54fa\u4e73\u671f\uff0c\u542b\u6709\u6709\u673a<br \/>\n\u91d1\u76cf\u82b1 3\u76ce\u53f8<br \/>\n$10.99[B078GTKVXY]<br \/>\nEarth Mama\u7684\u59dc\u5473\u6e05\u65b0\u9664\u81ed\u5242 | \u5929\u7136\u4e14\u9002\u7528\u4e8e<br \/>\n\u654f\u611f\u808c\u80a4\u3001\u5b55\u671f\u548c\u54fa\u4e73\u671f\uff0c\u542b\u6709\u6709\u673a<br \/>\n\u91d1\u76cf\u82b1 3\u76ce\u53f8<br \/>\n$10.99[B08KBVJ4XN]<br \/>\nBarrel and Oak &#8211; \u65e0\u94dd\u9664\u81ed\u5242\uff0c\u7537\u58eb\u7528<br \/>\n\u57fa\u4e8e\u7cbe\u6cb9\u7684\u9999\u5473\uff0c24\u5c0f\u65f6\u9632\u81ed\uff0c\u96ea\u677e<br \/>\n&amp; \u5e7f\u85ff\u9999\u6df7\u5408\uff0c\u6e29\u548c\u9002\u5408\u654f\u611f\u808c\u80a4\uff08\u5c71 sage\uff0c<br \/>\n2.7\u76ce\u53f8\uff0c2\u74f6\u88c5\uff09<br \/>\n$15.95<\/td>\n<\/tr>\n<tr>\n<td>\u70b9\u51fb[B078GWRC1J]<\/td>\n<td>\u8fd4\u56de\u641c\u7d22\u4e0a\u4e00\u9875<br \/>\n\u9999\u5473 [\u591a\u79cd\u9999\u5473][\u4eae\u67d1\u6a58][\u5b89\u629a\u85b0\u8863\u8349]\u59dc<br \/>\n[\u6e05\u65b0] \u7b80\u5355\u65e0\u9999]<br \/>\n\u5c3a\u5bf8 [\u65c5\u884c\u5957\u88c5 (4\u74f6\u88c5)][3\u76ce\u53f8 (1\u74f6\u88c5)][3\u76ce\u53f8 (2<br \/>\n\u74f6\u88c5)]<br \/>\nEarth Mama\u7684\u4eae\u67d1\u6a58\u9664\u81ed\u5242 | \u5929\u7136\u4e14\u9002\u7528\u4e8e<br \/>\n\u654f\u611f\u808c\u80a4\u3001\u5b55\u671f\u548c\u54fa\u4e73\u671f\uff0c\u542b\u6709\u6709\u673a<br \/>\n\u91d1\u76cf\u82b1 3\u76ce\u53f8<br \/>\n\u4ef7\u683c\uff1a$10.99<br \/>\n\u8bc4\u5206\uff1aN.A.<br \/>\n[\u63cf\u8ff0]<br \/>\n[\u7279\u70b9]<br \/>\n[\u8bc4\u8bba]<br 
\/>\n[\u7acb\u5373\u8d2d\u4e70]<\/td>\n<td>\u601d\u8003[B078GWRC1J\u548cB078GTKVXY\u662f\u4eae\u67d1\u6a58\u9999\u578b\u7684\u9664\u81ed\u5242\uff0c\u4ef7\u683c\u4f4e\u4e8e50\u7f8e\u5143\u3002\u6211\u53ef\u4ee5\u5148\u68c0\u67e5B078GWRC1J\u3002]<\/td>\n<td>\u597d\u7684\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u70b9\u51fb[\u4eae\u67d1\u6a58]<\/td>\n<td>\u60a8\u5df2\u70b9\u51fb\u4eae\u67d1\u6a58\u3002<\/td>\n<td>\u70b9\u51fb[B078GWRC1J]<\/td>\n<td>[\u8fd4\u56de\u641c\u7d22][\u4e0a\u4e00\u9875]<br \/>\n\u9999\u5473 [\u591a\u79cd\u9999\u5473][\u4eae\u67d1\u6a58][\u5b89\u629a\u85b0\u8863\u8349]\u59dc<br \/>\n[\u6e05\u65b0] \u7b80\u5355\u65e0\u9999]<br \/>\n\u5c3a\u5bf8 [\u65c5\u884c\u5957\u88c5 (4\u74f6\u88c5)][3\u76ce\u53f8 (1\u74f6\u88c5)][3\u76ce\u53f8 (2<br \/>\n\u74f6\u88c5)]<br \/>\nEarth Mama\u7684\u4eae\u67d1\u6a58\u9664\u81ed\u5242 | \u5929\u7136\u4e14\u9002\u7528\u4e8e<br \/>\n\u654f\u611f\u808c\u80a4\u3001\u5b55\u671f\u548c\u54fa\u4e73\u671f\uff0c\u542b\u6709\u6709\u673a<br \/>\n\u91d1\u76cf\u82b1 3\u76ce\u53f8<br \/>\n\u4ef7\u683c\uff1a$10.99<br \/>\n\u8bc4\u5206\uff1aN.A.<br \/>\n[\u63cf\u8ff0]<br \/>\n[\u7279\u70b9]<br \/>\n[\u8bc4\u8bba]<br \/>\n[\u7acb\u5373\u8d2d\u4e70]<\/td>\n<\/tr>\n<tr>\n<td>\u70b9\u51fb[3\u76ce\u53f8 (1\u74f6\u88c5)]<\/td>\n<td>\u60a8\u5df2\u70b9\u51fb3\u76ce\u53f8 (1\u74f6\u88c5)\u3002<\/td>\n<td>\u601d\u8003[\u5bf9\u4e8e3\u76ce\u53f8\u74f6\u88c5\u7684\u4eae\u67d1\u6a58\u9999\u578b\u654f\u611f\u808c\u80a4\u7528\u9664\u81ed\u5242\uff0c\u5546\u54c1\u6709&#8217;\u4eae\u67d1\u6a58&#8217;\u548c&#8217;3\u76ce\u53f8 (1\u74f6\u88c5)&#8217;\u7684\u9009\u9879\uff0c\u770b\u8d77\u6765\u53ef\u4ee5\u8d2d\u4e70\u3002]<\/td>\n<td>\u597d\u7684\u3002<\/td>\n<\/tr>\n<tr>\n<td>\u70b9\u51fb[\u7acb\u5373\u8d2d\u4e70]<\/td>\n<td><\/td>\n<td>\u70b9\u51fb[\u4eae\u67d1\u6a58]<\/td>\n<td>\u60a8\u5df2\u70b9\u51fb\u4eae\u67d1\u6a58\u3002<\/td>\n<\/tr>\n<tr>\n<td><\/td>\n<td><\/td>\n<td>\u70b9\u51fb[3\u76ce\u53f8 
(1\u74f6\u88c5)]<\/td>\n<td>\u60a8\u5df2\u70b9\u51fb3\u76ce\u53f8 (1\u74f6\u88c5)\u3002<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<\/div>\n<p>&nbsp;<\/p>\n<h3>C.4 ALFWORLD<\/h3>\n<p>ALFWORLD\u6a21\u62df\u5668,\u8be5\u73af\u5883\u5305\u542b\u8d85\u8fc725000\u4e2a\u72ec\u7279\u7684\u3001\u7a0b\u5e8f\u751f\u6210\u7684\u4efb\u52a1\uff0c\u6db5\u76d6\u53a8\u623f\u3001\u5ba2\u5385\u3001\u5367\u5ba4\u7b49\u771f\u5b9e\u73af\u5883\u3002<\/p>\n<blockquote><p>You are in the middle of a room. Looking quickly around you, you see a cabinet<br \/>\n13, a cabinet 12, a cabinet 11, a cabinet 10, a cabinet 9, a cabinet 8, a cabinet<br \/>\n7, a cabinet 6, a cabinet 5, a cabinet 4, a cabinet 3, a cabinet 2, a cabinet<br \/>\n1, a coffeemachine 1, a countertop 1, a diningtable 1, a drawer 1, a fridge 1, a<br \/>\ngarbagecan 1, a microwave 1, a shelf 3, a shelf 2, a shelf 1, a sinkbasin 1, a<br \/>\nstoveburner 4, a stoveburner 3, a stoveburner 2, a stoveburner 1, and a toaster 1.<br \/>\nYour task is to: put a clean lettuce in diningtable.<br \/>\n&gt; go to fridge 1<br \/>\nThe fridge 1 is closed.<br \/>\n&gt; open fridge 1<br \/>\nYou open the fridge 1. The fridge 1 is open. In it, you see a cup 3, a egg 2, a<br \/>\npotato 3, and a potato 2.<br \/>\n&gt; go to diningtable 1<br \/>\nOn the diningtable 1, you see a apple 1, a bread 1, a butterknife 2, a cup 2, a<br \/>\nfork 2, a knife 2, a knife 1, a ladle 1, a lettuce 1, a mug 2, a mug 1, a pan 2, a<br \/>\npeppershaker 1, a spatula 3, a tomato 2, and a tomato 1.<br \/>\n&gt; take lettuce 1 from diningtable 1<br \/>\nYou pick up the lettuce 1 from the diningtable 1.<br \/>\n&gt; go to sinkbasin 1<br \/>\nOn the sinkbasin 1, you see a apple 2, a ladle 2, a spoon 1, and a tomato 3.<br \/>\n&gt; clean lettuce 1 with sinkbasin 1<br \/>\nYou clean the lettuce 1 using the sinkbasin 1.<br \/>\n&gt; think: Now I clean a lettuce (1). 
Next, I need to put it in\/on diningtable 1.<br \/>\nOK.<br \/>\n&gt; go to diningtable 1<br \/>\nOn the diningtable 1, you see a apple 1, a bread 1, a butterknife 2, a cup 2, a fork<br \/>\n2, a knife 2, a knife 1, a ladle 1, a mug 2, a mug 1, a pan 2, a peppershaker 1, a<br \/>\nspatula 3, a tomato 2, and a tomato 1.<br \/>\n&gt; put lettuce 1 in\/on diningtable 1<br \/>\nYou put the lettuce 1 in\/on the diningtable 1.<\/p><\/blockquote>\n<p>\u88687\uff1a\u5173\u4e8eALFWorld\u6e05\u6d01\u4efb\u52a1\u7684\u884c\u52a8\u63d0\u793a\u3002\u6ca1\u6709\u63d0\u4f9b\u60f3\u6cd5\u3002<\/p>\n<p>&nbsp;<\/p>\n<blockquote><p>\u4f60\u5728\u4e00\u4e2a\u623f\u95f4\u7684\u4e2d\u95f4\u3002\u5feb\u901f\u73af\u987e\u56db\u5468\uff0c\u4f60\u770b\u5230\u4e00\u4e2a\u67dc\u5b50<br \/>\n13\u3001\u67dc\u5b5012\u3001\u67dc\u5b5011\u3001\u67dc\u5b5010\u3001\u67dc\u5b509\u3001\u67dc\u5b508\u3001\u67dc\u5b50<br \/>\n7\u3001\u67dc\u5b506\u3001\u67dc\u5b505\u3001\u67dc\u5b504\u3001\u67dc\u5b503\u3001\u67dc\u5b502\u3001\u67dc\u5b50<br \/>\n1\u3001\u5496\u5561\u673a1\u53f0\u3001\u53f0\u97621\u3001\u9910\u684c1\u3001\u62bd\u5c491\u3001\u51b0\u7bb11\u3001<br \/>\n\u5783\u573e\u68761\u4e2a\u3001\u5fae\u6ce2\u70891\u4e2a\u3001\u67b6\u5b503\u4e2a\u3001\u67b6\u5b502\u4e2a\u3001\u67b6\u5b501\u4e2a\u3001\u6c34\u69fd1\u4e2a\u3001<br \/>\n\u7089\u70764\u3001\u7089\u70763\u3001\u7089\u70762\u3001\u7089\u70761\u548c\u70e4\u9762\u5305\u673a1\u3002<br \/>\n\u4f60\u7684\u4efb\u52a1\u662f\uff1a\u5c06\u5e72\u51c0\u7684\u751f\u83dc\u653e\u5165\u9910\u684c\u3002<br \/>\n&gt; \u524d\u5f80\u51b0\u7bb1 1<br \/>\n\u51b0\u7bb11\u5173\u95ed\u3002<br \/>\n&gt; \u6253\u5f00\u51b0\u7bb1 1<br \/>\n\u60a8\u6253\u5f00\u51b0\u7bb1 1\u3002\u51b0\u7bb1 1 \u5df2\u6253\u5f00\u3002\u5728\u5176\u4e2d\uff0c\u60a8\u53ef\u4ee5\u770b\u5230\u4e00\u4e2a\u676f\u5b50 3\u3001\u4e00\u4e2a\u9e21\u86cb 2\u3001\u4e00\u4e2a<br \/>\n\u9a6c\u94c3\u85af3\u4e2a\uff0c\u9a6c\u94c3\u85af2\u4e2a\u3002<br \/>\n&gt; \u524d\u5f80\u9910\u684c 1<br 
\/>\n\u5728\u9910\u684c 1 \u4e0a\uff0c\u60a8\u53ef\u4ee5\u770b\u5230\u4e00\u4e2a\u82f9\u679c 1\u3001\u4e00\u4e2a\u9762\u5305 1\u3001\u4e00\u628a\u9ec4\u6cb9\u5200 2\u3001\u4e00\u4e2a\u676f\u5b50 2\u3001\u4e00\u4e2a<br \/>\n\u53c9\u5b50 2\u3001\u5200 2\u3001\u5200 1\u3001\u957f\u67c4\u52fa 1\u3001\u751f\u83dc 1\u3001\u9a6c\u514b\u676f 2\u3001\u9a6c\u514b\u676f 1\u3001\u5e73\u5e95\u9505 2\u3001<br \/>\n\u80e1\u6912\u74f6 1\u3001\u62b9\u5200 3\u3001\u756a\u8304 2 \u548c\u756a\u8304 1\u3002<br \/>\n&gt; \u4ece\u9910\u684c 1 \u4e2d\u53d6\u51fa\u751f\u83dc 1<br \/>\n\u4f60\u4ece\u9910\u684c 1 \u62ff\u8d77\u751f\u83dc 1\u3002<br \/>\n&gt; \u524d\u5f80\u6c34\u69fd 1<br \/>\n\u5728\u6c34\u69fd 1 \u4e0a\uff0c\u60a8\u53ef\u4ee5\u770b\u5230\u4e00\u4e2a\u82f9\u679c 2\u3001\u4e00\u4e2a\u957f\u67c4\u52fa 2\u3001\u4e00\u4e2a\u52fa\u5b50 1 \u548c\u4e00\u4e2a\u756a\u8304 3\u3002<br \/>\n&gt; \u7528\u6c34\u69fd 1 \u6e05\u6d17\u751f\u83dc 1<br \/>\n\u60a8\u4f7f\u7528\u6c34\u69fd 1 \u6e05\u6d17\u751f\u83dc 1\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u73b0\u5728\u6211\u6e05\u6d17\u4e00\u9897\u751f\u83dc (1)\u3002\u63a5\u4e0b\u6765\uff0c\u6211\u9700\u8981\u5c06\u5176\u653e\u5165\u9910\u684c 1 \u4e2d\/\u4e0a\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u524d\u5f80\u9910\u684c 1<br \/>\n\u5728\u9910\u684c 1 \u4e0a\uff0c\u60a8\u53ef\u4ee5\u770b\u5230\u82f9\u679c 1\u3001\u9762\u5305 1\u3001\u9ec4\u6cb9\u5200 2\u3001\u676f\u5b50 2\u3001\u53c9\u5b50<br \/>\n2\u3001\u5200 2\u3001\u5200 1\u3001\u957f\u67c4\u52fa 1\u3001\u9a6c\u514b\u676f 2\u3001\u9a6c\u514b\u676f 1\u3001\u5e73\u5e95\u9505 2\u3001\u80e1\u6912\u74f6 1\u3001<br \/>\n\u62b9\u5200 3\u3001\u756a\u8304 2 \u548c\u756a\u8304 1\u3002<br \/>\n&gt; \u5c06\u751f\u83dc 1 \u653e\u5165\u9910\u684c 1 \u4e2d\/\u4e0a<br \/>\n\u60a8\u5c06\u751f\u83dc 1 \u653e\u5165\/\u653e\u5728\u9910\u684c 1 \u4e0a\u3002<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<blockquote><p>You are in the middle of a room. 
Looking quickly around you, you see a cabinet<br \/>\n13, a cabinet 12, a cabinet 11, a cabinet 10, a cabinet 9, a cabinet 8, a cabinet<br \/>\n7, a cabinet 6, a cabinet 5, a cabinet 4, a cabinet 3, a cabinet 2, a cabinet<br \/>\n1, a coffeemachine 1, a countertop 1, a diningtable 1, a drawer 1, a fridge 1, a<br \/>\ngarbagecan 1, a microwave 1, a shelf 3, a shelf 2, a shelf 1, a sinkbasin 1, a<br \/>\nstoveburner 4, a stoveburner 3, a stoveburner 2, a stoveburner 1, and a toaster 1.<br \/>\nYour task is to: put a clean lettuce in diningtable.<br \/>\n&gt; think: To solve the task, I need to find and take a lettuce, then clean it with<br \/>\nsinkbasin, then put it in diningtable.<br \/>\nOK.<br \/>\n&gt; think: First I need to find a lettuce. A lettuce is more likely to appear in<br \/>\nfridge (1), diningtable (1), sinkbasin (1), stoveburner (1-3), cabinet (1-13). I<br \/>\ncan check one by one, starting with fridge 1.<br \/>\nOK.<br \/>\n&gt; go to fridge 1<br \/>\nThe fridge 1 is closed.<br \/>\n&gt; open fridge 1<br \/>\nYou open the fridge 1. The fridge 1 is open. In it, you see a cup 3, a egg 2, a<br \/>\npotato 3, and a potato 2.<br \/>\n&gt; go to diningtable 1<br \/>\nOn the diningtable 1, you see a apple 1, a bread 1, a butterknife 2, a cup 2, a<br \/>\nfork 2, a knife 2, a knife 1, a ladle 1, a lettuce 1, a mug 2, a mug 1, a pan 2, a<br \/>\npeppershaker 1, a spatula 3, a tomato 2, and a tomato 1.<br \/>\n&gt; think: Now I find a lettuce (1). Next, I need to take it.<br \/>\nOK.<br \/>\n&gt; take lettuce 1 from diningtable 1<br \/>\nYou pick up the lettuce 1 from the diningtable 1.<br \/>\n&gt; think: Now I take a lettuce (1). 
Next, I need to go to sinkbasin (1) and clean<br \/>\nit.<br \/>\nOK.<br \/>\n&gt; go to sinkbasin 1<br \/>\nOn the sinkbasin 1, you see a apple 2, a ladle 2, a spoon 1, and a tomato 3.<br \/>\n&gt; clean lettuce 1 with sinkbasin 1<br \/>\nYou clean the lettuce 1 using the sinkbasin 1.<br \/>\n&gt; think: Now I clean a lettuce (1). Next, I need to put it in\/on diningtable 1.<br \/>\nOK.<br \/>\n&gt; go to diningtable 1<br \/>\nOn the diningtable 1, you see a apple 1, a bread 1, a butterknife 2, a cup 2, a fork<br \/>\n2, a knife 2, a knife 1, a ladle 1, a mug 2, a mug 1, a pan 2, a peppershaker 1, a<br \/>\nspatula 3, a tomato 2, and a tomato 1.<br \/>\n&gt; put lettuce 1 in\/on diningtable 1<br \/>\nYou put the lettuce 1 in\/on the diningtable 1.<\/p><\/blockquote>\n<p>\u88688\uff1a\u5173\u4e8eALFWorld\u6e05\u6d01\u4efb\u52a1\u7684ReAct\u884c\u52a8\u63d0\u793a\u3002<\/p>\n<p>&nbsp;<\/p>\n<blockquote><p>\u4f60\u5728\u4e00\u4e2a\u623f\u95f4\u7684\u4e2d\u592e\u3002\u5feb\u901f\u73af\u987e\u56db\u5468\uff0c\u4f60\u770b\u5230\u4e00\u4e2a\u6a71\u67dc13\u3001\u4e00\u4e2a\u6a71\u67dc12\u3001\u4e00\u4e2a\u6a71\u67dc11\u3001\u4e00\u4e2a\u6a71\u67dc10\u3001\u4e00\u4e2a\u6a71\u67dc9\u3001\u4e00\u4e2a\u6a71\u67dc8\u3001\u4e00\u4e2a\u6a71\u67dc7\u3001\u4e00\u4e2a\u6a71\u67dc6\u3001\u4e00\u4e2a\u6a71\u67dc5\u3001\u4e00\u4e2a\u6a71\u67dc4\u3001\u4e00\u4e2a\u6a71\u67dc3\u3001\u4e00\u4e2a\u6a71\u67dc2\u548c\u4e00\u4e2a\u6a71\u67dc1\u3001\u4e00\u4e2a\u5496\u5561\u673a1\u3001\u4e00\u4e2a\u53f0\u97621\u3001\u4e00\u4e2a\u9910\u684c1\u3001\u4e00\u4e2a\u62bd\u5c491\u3001\u4e00\u4e2a\u51b0\u7bb11\u3001\u4e00\u4e2a\u5783\u573e\u68761\u3001\u4e00\u4e2a\u5fae\u6ce2\u70891\u3001\u4e00\u4e2a\u67b6\u5b503\u3001\u4e00\u4e2a\u67b6\u5b502\u3001\u4e00\u4e2a\u67b6\u5b501\u3001\u4e00\u4e2a\u6d17\u624b\u76c61\u3001\u4e00\u4e2a\u7089\u59344\u3001\u4e00\u4e2a\u7089\u59343\u3001\u4e00\u4e2a\u7089\u59342\u3001\u4e00\u4e2a\u7089\u59341\u548c\u4e00\u53f0\u70e4\u9762\u5305\u673a1\u3002<br 
\/>\n\u4f60\u7684\u4efb\u52a1\u662f\uff1a\u5728\u9910\u684c\u4e0a\u653e\u4e00\u9897\u5e72\u51c0\u7684\u751f\u83dc\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u8981\u89e3\u51b3\u8fd9\u4e2a\u4efb\u52a1\uff0c\u6211\u9700\u8981\u627e\u5230\u5e76\u62ff\u4e00\u9897\u751f\u83dc\uff0c\u7136\u540e\u5728\u6d17\u624b\u76c6\u91cc\u6e05\u6d17\uff0c\u6700\u540e\u653e\u5728\u9910\u684c\u4e0a\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u9996\u5148\u6211\u9700\u8981\u627e\u5230\u4e00\u9897\u751f\u83dc\u3002\u751f\u83dc\u66f4\u53ef\u80fd\u51fa\u73b0\u5728\u51b0\u7bb1\uff081\uff09\u3001\u9910\u684c\uff081\uff09\u3001\u6d17\u624b\u76c6\uff081\uff09\u3001\u7089\u5934\uff081-3\uff09\u3001\u6a71\u67dc\uff081-13\uff09\u91cc\u3002\u6211\u53ef\u4ee5\u4e00\u4e2a\u4e00\u4e2a\u68c0\u67e5\uff0c\u4ece\u51b0\u7bb11\u5f00\u59cb\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u53bb\u51b0\u7bb11<br \/>\n\u51b0\u7bb11\u662f\u5173\u95ed\u7684\u3002<br \/>\n&gt; \u6253\u5f00\u51b0\u7bb11<br \/>\n\u4f60\u6253\u5f00\u4e86\u51b0\u7bb11\u3002\u51b0\u7bb11\u73b0\u5728\u662f\u5f00\u7740\u7684\u3002\u5728\u91cc\u8fb9\uff0c\u4f60\u770b\u5230\u4e86\u4e00\u4e2a\u676f\u5b503\u3001\u4e00\u4e2a\u9e21\u86cb2\u3001\u4e00\u4e2a\u571f\u8c463\u548c\u4e00\u4e2a\u571f\u8c462\u3002<br \/>\n&gt; \u53bb\u9910\u684c1<br \/>\n\u5728\u9910\u684c1\u4e0a\uff0c\u4f60\u770b\u5230\u4e86\u4e00\u4e2a\u82f9\u679c1\u3001\u4e00\u4e2a\u9762\u53051\u3001\u4e00\u628a\u9ec4\u6cb9\u52002\u3001\u4e00\u4e2a\u676f\u5b502\u3001\u4e00\u4e2a\u53c9\u5b502\u3001\u4e00\u4e2a\u52002\u3001\u4e00\u4e2a\u52001\u3001\u4e00\u4e2a\u52fa\u5b501\u3001\u4e00\u4e2a\u9505\u94f21\u3001\u4e00\u4e2a\u751f\u83dc1\u3001\u4e00\u4e2a\u9a6c\u514b\u676f2\u3001\u4e00\u4e2a\u9a6c\u514b\u676f1\u3001\u4e00\u4e2a\u5e73\u5e95\u95052\u3001\u4e00\u4e2a\u80e1\u6912\u74f61\u3001\u4e00\u4e2a\u52fa\u5b503\u3001\u4e00\u4e2a\u756a\u83042\u548c\u4e00\u4e2a\u756a\u83041\u3002<br \/>\n&gt; 
\u601d\u8003\uff1a\u73b0\u5728\u6211\u627e\u5230\u4e86\u4e00\u9897\u751f\u83dc\uff081\uff09\u3002\u63a5\u4e0b\u6765\uff0c\u6211\u9700\u8981\u62ff\u8d70\u5b83\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u4ece\u9910\u684c1\u62ff\u8d70\u751f\u83dc1<br \/>\n\u4f60\u4ece\u9910\u684c1\u4e0a\u62ff\u8d77\u4e86\u751f\u83dc1\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u73b0\u5728\u6211\u62ff\u8d70\u4e86\u4e00\u9897\u751f\u83dc\uff081\uff09\u3002\u63a5\u4e0b\u6765\uff0c\u6211\u9700\u8981\u53bb\u6d17\u624b\u76c6\uff081\uff09\u6e05\u6d17\u5b83\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u53bb\u6d17\u624b\u76c61<br \/>\n\u5728\u6d17\u624b\u76c61\u4e0a\uff0c\u4f60\u770b\u5230\u4e86\u4e00\u4e2a\u82f9\u679c2\u3001\u4e00\u4e2a\u9505\u94f22\u3001\u4e00\u4e2a\u52fa\u5b501\u548c\u4e00\u4e2a\u756a\u83043\u3002<br \/>\n&gt; \u7528\u6d17\u624b\u76c61\u6e05\u6d17\u751f\u83dc1<br \/>\n\u4f60\u7528\u6d17\u624b\u76c61\u6e05\u6d17\u4e86\u751f\u83dc1\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u73b0\u5728\u6211\u6e05\u6d17\u4e86\u4e00\u9897\u751f\u83dc\uff081\uff09\u3002\u63a5\u4e0b\u6765\uff0c\u6211\u9700\u8981\u628a\u5b83\u653e\u5728\u9910\u684c1\u4e0a\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u53bb\u9910\u684c1<br \/>\n\u5728\u9910\u684c1\u4e0a\uff0c\u4f60\u770b\u5230\u4e86\u4e00\u4e2a\u82f9\u679c1\u3001\u4e00\u4e2a\u9762\u53051\u3001\u4e00\u628a\u9ec4\u6cb9\u52002\u3001\u4e00\u4e2a\u676f\u5b502\u3001\u4e00\u4e2a\u53c9\u5b502\u3001\u4e00\u4e2a\u52002\u3001\u4e00\u4e2a\u52001\u3001\u4e00\u4e2a\u52fa\u5b501\u3001\u4e00\u4e2a\u9a6c\u514b\u676f2\u3001\u4e00\u4e2a\u9a6c\u514b\u676f1\u3001\u4e00\u4e2a\u5e73\u5e95\u95052\u3001\u4e00\u4e2a\u80e1\u6912\u74f61\u3001\u4e00\u4e2a\u52fa\u5b503\u3001\u4e00\u4e2a\u756a\u83042\u548c\u4e00\u4e2a\u756a\u83041\u3002<br \/>\n&gt; \u628a\u751f\u83dc1\u653e\u5728\u9910\u684c1\u4e0a<br \/>\n\u4f60\u628a\u751f\u83dc1\u653e\u5728\u4e86\u9910\u684c1\u4e0a\u3002<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<blockquote><p>You are in the middle of a room. 
Looking quickly around you, you see a cabinet<br \/>\n13, a cabinet 12, a cabinet 11, a cabinet 10, a cabinet 9, a cabinet 8, a cabinet<br \/>\n7, a cabinet 6, a cabinet 5, a cabinet 4, a cabinet 3, a cabinet 2, a cabinet<br \/>\n1, a coffeemachine 1, a countertop 1, a diningtable 1, a drawer 1, a fridge 1, a<br \/>\ngarbagecan 1, a microwave 1, a shelf 3, a shelf 2, a shelf 1, a sinkbasin 1, a<br \/>\nstoveburner 4, a stoveburner 3, a stoveburner 2, a stoveburner 1, and a toaster 1.<br \/>\nYour task is to: put a clean lettuce in diningtable.<br \/>\n&gt; think: To solve the task, I need to find and take a lettuce, then clean it with<br \/>\nsinkbasin, then put it in diningtable.<br \/>\nOK.<br \/>\n&gt; think: First I need to find a lettuce.<br \/>\nOK.<br \/>\n&gt; go to fridge 1<br \/>\nThe fridge 1 is closed.<br \/>\n&gt; think: First I need to find a lettuce.<br \/>\nOK.<br \/>\n&gt; open fridge 1<br \/>\nYou open the fridge 1. The fridge 1 is open. In it, you see a cup 3, a egg 2, a<br \/>\npotato 3, and a potato 2.<br \/>\n&gt; think: First I need to find a lettuce.<br \/>\nOK.<br \/>\n&gt; go to diningtable 1<br \/>\nOn the diningtable 1, you see a apple 1, a bread 1, a butterknife 2, a cup 2, a<br \/>\nfork 2, a knife 2, a knife 1, a ladle 1, a lettuce 1, a mug 2, a mug 1, a pan 2, a<br \/>\npeppershaker 1, a spatula 3, a tomato 2, and a tomato 1.<br \/>\n&gt; think: First I need to find a lettuce.<br \/>\nOK.<br \/>\n&gt; take lettuce 1 from diningtable 1<br \/>\nYou pick up the lettuce 1 from the diningtable 1.<br \/>\n&gt; think: I need to clean this lettuce (1) using sinkbasin 1.<br \/>\nOK.<br \/>\n&gt; go to sinkbasin 1<br \/>\nOn the sinkbasin 1, you see a apple 2, a ladle 2, a spoon 1, and a tomato 3.<br \/>\n&gt; think: I need to clean this lettuce (1) using sinkbasin 1.<br \/>\nOK.<br \/>\n&gt; clean lettuce 1 with sinkbasin 1<br \/>\nYou clean the lettuce 1 using the sinkbasin 1.<br \/>\n&gt; think: I need to put this cleaned lettuce (1) in\/on 
diningtable 1.<br \/>\nOK.<br \/>\n&gt; go to diningtable 1<br \/>\nOn the diningtable 1, you see a apple 1, a bread 1, a butterknife 2, a cup 2, a fork<br \/>\n2, a knife 2, a knife 1, a ladle 1, a mug 2, a mug 1, a pan 2, a peppershaker 1, a<br \/>\nspatula 3, a tomato 2, and a tomato 1.<br \/>\n&gt; think: I need to put this cleaned lettuce (1) in\/on diningtable 1.<br \/>\nOK.<br \/>\n&gt; put lettuce 1 in\/on diningtable 1<br \/>\nYou put the lettuce 1 in\/on the diningtable 1.<\/p><\/blockquote>\n<p>\u88689\uff1a\u5173\u4e8eALFWorld\u6e05\u6d01\u4efb\u52a1\u7684ReAct-IM\u884c\u52a8\u63d0\u793a\u3002<\/p>\n<p>&nbsp;<\/p>\n<blockquote><p>\u4f60\u5728\u4e00\u4e2a\u623f\u95f4\u7684\u4e2d\u592e\u3002\u5feb\u901f\u73af\u987e\u56db\u5468\uff0c\u4f60\u770b\u5230\u4e00\u4e2a\u6a71\u67dc13\uff0c\u4e00\u4e2a\u6a71\u67dc12\uff0c\u4e00\u4e2a\u6a71\u67dc11\uff0c\u4e00\u4e2a\u6a71\u67dc10\uff0c\u4e00\u4e2a\u6a71\u67dc9\uff0c\u4e00\u4e2a\u6a71\u67dc8\uff0c\u4e00\u4e2a\u6a71\u67dc7\uff0c\u4e00\u4e2a\u6a71\u67dc6\uff0c\u4e00\u4e2a\u6a71\u67dc5\uff0c\u4e00\u4e2a\u6a71\u67dc4\uff0c\u4e00\u4e2a\u6a71\u67dc3\uff0c\u4e00\u4e2a\u6a71\u67dc2\uff0c\u4e00\u4e2a\u6a71\u67dc1\uff0c\u4e00\u4e2a\u5496\u5561\u673a1\uff0c\u4e00\u4e2a\u53f0\u97621\uff0c\u4e00\u4e2a\u9910\u684c1\uff0c\u4e00\u4e2a\u62bd\u5c491\uff0c\u4e00\u4e2a\u51b0\u7bb11\uff0c\u4e00\u4e2a\u5783\u573e\u68761\uff0c\u4e00\u4e2a\u5fae\u6ce2\u70891\uff0c\u4e00\u4e2a\u67b6\u5b503\uff0c\u4e00\u4e2a\u67b6\u5b502\uff0c\u4e00\u4e2a\u67b6\u5b501\uff0c\u4e00\u4e2a\u6d17\u624b\u76c61\uff0c\u4e00\u4e2a\u7089\u7076\u71c3\u70e7\u56684\uff0c\u4e00\u4e2a\u7089\u7076\u71c3\u70e7\u56683\uff0c\u4e00\u4e2a\u7089\u7076\u71c3\u70e7\u56682\uff0c\u4e00\u4e2a\u7089\u7076\u71c3\u70e7\u56681\uff0c\u548c\u4e00\u4e2a\u70e4\u9762\u5305\u673a1\u3002<br \/>\n\u4f60\u7684\u4efb\u52a1\u662f\uff1a\u5728\u9910\u684c\u4e0a\u653e\u4e00\u9897\u5e72\u51c0\u7684\u751f\u83dc\u3002<br \/>\n&gt; 
\u601d\u8003\uff1a\u8981\u89e3\u51b3\u8fd9\u4e2a\u4efb\u52a1\uff0c\u6211\u9700\u8981\u627e\u5230\u5e76\u62ff\u4e00\u9897\u751f\u83dc\uff0c\u7136\u540e\u7528\u6d17\u624b\u76c6\u6e05\u6d17\u5b83\uff0c\u518d\u628a\u5b83\u653e\u5728\u9910\u684c\u4e0a\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u9996\u5148\u6211\u9700\u8981\u627e\u5230\u4e00\u9897\u751f\u83dc\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u53bb\u51b0\u7bb11<br \/>\n\u51b0\u7bb11\u662f\u5173\u95ed\u7684\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u9996\u5148\u6211\u9700\u8981\u627e\u5230\u4e00\u9897\u751f\u83dc\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u6253\u5f00\u51b0\u7bb11<br \/>\n\u4f60\u6253\u5f00\u4e86\u51b0\u7bb11\u3002\u51b0\u7bb11\u73b0\u5728\u662f\u5f00\u7740\u7684\u3002\u5728\u51b0\u7bb1\u91cc\uff0c\u4f60\u770b\u5230\u4e86\u4e00\u4e2a\u676f\u5b503\uff0c\u4e00\u4e2a\u9e21\u86cb2\uff0c\u4e00\u4e2a\u571f\u8c463\uff0c\u548c\u4e00\u4e2a\u571f\u8c462\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u9996\u5148\u6211\u9700\u8981\u627e\u5230\u4e00\u9897\u751f\u83dc\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u53bb\u9910\u684c1<br \/>\n\u5728\u9910\u684c1\u4e0a\uff0c\u4f60\u770b\u5230\u4e86\u4e00\u4e2a\u82f9\u679c1\uff0c\u4e00\u4e2a\u9762\u53051\uff0c\u4e00\u628a\u9ec4\u6cb9\u52002\uff0c\u4e00\u4e2a\u676f\u5b502\uff0c\u4e00\u4e2a\u53c9\u5b502\uff0c\u4e00\u4e2a\u5200\u5b502\uff0c\u4e00\u4e2a\u5200\u5b501\uff0c\u4e00\u4e2a\u52fa\u5b501\uff0c\u4e00\u4e2a\u9505\u94f21\uff0c\u4e00\u4e2a\u751f\u83dc1\uff0c\u4e00\u4e2a\u9a6c\u514b\u676f2\uff0c\u4e00\u4e2a\u9a6c\u514b\u676f1\uff0c\u4e00\u4e2a\u5e73\u5e95\u95052\uff0c\u4e00\u4e2a\u80e1\u6912\u74f61\uff0c\u4e00\u4e2a\u94f2\u5b503\uff0c\u4e00\u4e2a\u756a\u83042\uff0c\u548c\u4e00\u4e2a\u756a\u83041\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u9996\u5148\u6211\u9700\u8981\u627e\u5230\u4e00\u9897\u751f\u83dc\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u4ece\u9910\u684c1\u4e0a\u62ff\u8d70\u751f\u83dc1<br 
\/>\n\u4f60\u4ece\u9910\u684c1\u4e0a\u62ff\u8d77\u4e86\u751f\u83dc1\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u6211\u9700\u8981\u4f7f\u7528\u6d17\u624b\u76c61\u6e05\u6d17\u8fd9\u9897\u751f\u83dc\uff081\uff09\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u53bb\u6d17\u624b\u76c61<br \/>\n\u5728\u6d17\u624b\u76c61\u4e0a\uff0c\u4f60\u770b\u5230\u4e86\u4e00\u4e2a\u82f9\u679c2\uff0c\u4e00\u4e2a\u9505\u94f22\uff0c\u4e00\u4e2a\u52fa\u5b501\uff0c\u548c\u4e00\u4e2a\u756a\u83043\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u6211\u9700\u8981\u4f7f\u7528\u6d17\u624b\u76c61\u6e05\u6d17\u8fd9\u9897\u751f\u83dc\uff081\uff09\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u4f7f\u7528\u6d17\u624b\u76c61\u6e05\u6d17\u751f\u83dc1<br \/>\n\u4f60\u4f7f\u7528\u6d17\u624b\u76c61\u6e05\u6d17\u4e86\u751f\u83dc1\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u6211\u9700\u8981\u628a\u8fd9\u9897\u5df2\u7ecf\u6e05\u6d17\u8fc7\u7684\u751f\u83dc\uff081\uff09\u653e\u5728\u9910\u684c\u4e0a\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u53bb\u9910\u684c1<br \/>\n\u5728\u9910\u684c1\u4e0a\uff0c\u4f60\u770b\u5230\u4e86\u4e00\u4e2a\u82f9\u679c1\uff0c\u4e00\u4e2a\u9762\u53051\uff0c\u4e00\u628a\u9ec4\u6cb9\u52002\uff0c\u4e00\u4e2a\u676f\u5b502\uff0c\u4e00\u4e2a\u53c9\u5b502\uff0c\u4e00\u4e2a\u5200\u5b502\uff0c\u4e00\u4e2a\u5200\u5b501\uff0c\u4e00\u4e2a\u52fa\u5b501\uff0c\u4e00\u4e2a\u9a6c\u514b\u676f2\uff0c\u4e00\u4e2a\u9a6c\u514b\u676f1\uff0c\u4e00\u4e2a\u5e73\u5e95\u95052\uff0c\u4e00\u4e2a\u80e1\u6912\u74f61\uff0c\u4e00\u4e2a\u94f2\u5b503\uff0c\u4e00\u4e2a\u756a\u83042\uff0c\u548c\u4e00\u4e2a\u756a\u83041\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u6211\u9700\u8981\u628a\u8fd9\u9897\u5df2\u7ecf\u6e05\u6d17\u8fc7\u7684\u751f\u83dc\uff081\uff09\u653e\u5728\u9910\u684c\u4e0a\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u628a\u751f\u83dc1\u653e\u5728\u9910\u684c\u4e0a<br \/>\n\u4f60\u628a\u751f\u83dc1\u653e\u5728\u4e86\u9910\u684c\u4e0a\u3002<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<p>&nbsp;<\/p>\n<h2>D 
\u8f68\u8ff9<\/h2>\n<p>&nbsp;<\/p>\n<h3>D.1 FEVER \u8f68\u8ff9<\/h3>\n<p>\u6211\u4eec\u63d0\u4f9b\u4e86\u4e00\u4e9b\u7531ReAct\u3001CoT\u548cAct\u4ea7\u751f\u7684\u8f68\u8ff9\uff0c\u4e0b\u9762\u662fFEVER dev\u96c6\u4e2d\u51e0\u4e2a\u968f\u673a\u9009\u62e9\u793a\u4f8b\u3002\u641c\u7d22\u7ed3\u679c\u88ab\u7701\u7565\u4ee5\u8282\u7701\u7a7a\u95f4\u3002<\/p>\n<p>&nbsp;<\/p>\n<p><strong>\u793a\u4f8b 2491\uff08\u6807\u51c6\u7b54\u6848\uff1a\u53cd\u9a73\uff09<\/strong><\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\nClaim: Bermuda Triangle is a loosely-defined region in the Pacific Ocean.<br \/>\nThought 1: I need to search Bermuda Triangle and find if it is in the Pacific Ocean.<br \/>\nAction 1: Search[Bermuda Triangle]<br \/>\nObservation 1: Reportedly haunted locations&#8230;<br \/>\nThought 2: The observation says that it is in the western part of the North Atlantic<br \/>\nOcean, so it is not in the Pacific Ocean.<br \/>\nAction 2: Finish[REFUTES]<br \/>\nObservation 2: Episode finished<br \/>\n<strong>Act<\/strong><br \/>\nClaim: Bermuda Triangle is a loosely-defined region in the Pacific Ocean.<br \/>\nAction 1 : Search[Bermuda Triangle]<br \/>\nObservation 1 : Reportedly haunted locations:&#8230;<br \/>\nAction 2: Finish[REFUTES]<br \/>\nObservation 2: Episode finished<br \/>\n<strong>CoT<\/strong><br \/>\nClaim: Bermuda Triangle is a loosely-defined region in the Pacific Ocean.<br \/>\nThought: Let\u2019s think step by step. The Bermuda Triangle is a loosely-defined region<br \/>\nin the Atlantic Ocean. 
The Pacific Ocean is not the Atlantic Ocean.<br \/>\nAnswer: REFUTES<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<blockquote><p><strong>ReAct\uff08\u53cd\u5e94\uff09<\/strong><\/p>\n<p>\u58f0\u660e\uff1a\u767e\u6155\u5927\u4e09\u89d2\u662f\u592a\u5e73\u6d0b\u4e0a\u4e00\u4e2a\u5b9a\u4e49\u4e0d\u4e25\u683c\u7684\u533a\u57df\u3002<\/p>\n<p>\u601d\u80031\uff1a\u6211\u9700\u8981\u641c\u7d22\u767e\u6155\u5927\u4e09\u89d2\uff0c\u627e\u51fa\u5b83\u662f\u5426\u4f4d\u4e8e\u592a\u5e73\u6d0b\u3002<\/p>\n<p>\u884c\u52a81\uff1a\u641c\u7d22[\u767e\u6155\u5927\u4e09\u89d2]<\/p>\n<p>\u89c2\u5bdf1\uff1a\u636e\u62a5\u9053\uff0c\u8fd9\u662f\u4e00\u4e9b\u95f9\u9b3c\u7684\u5730\u70b9&#8230;<\/p>\n<p>\u601d\u80032\uff1a\u89c2\u5bdf\u7ed3\u679c\u663e\u793a\uff0c\u5b83\u4f4d\u4e8e\u5317\u5927\u897f\u6d0b\u7684\u897f\u90e8\uff0c\u6240\u4ee5\u5b83\u4e0d\u5728\u592a\u5e73\u6d0b\u3002<\/p>\n<p>\u884c\u52a82\uff1a\u7ed3\u675f[\u9a73\u65a5]<\/p>\n<p>\u89c2\u5bdf2\uff1a\u60c5\u8282\u7ed3\u675f<\/p>\n<p><strong>Act\uff08\u884c\u52a8\uff09<\/strong><\/p>\n<p>\u58f0\u660e\uff1a\u767e\u6155\u5927\u4e09\u89d2\u662f\u592a\u5e73\u6d0b\u4e0a\u4e00\u4e2a\u5b9a\u4e49\u4e0d\u4e25\u683c\u7684\u533a\u57df\u3002<\/p>\n<p>\u884c\u52a81\uff1a\u641c\u7d22[\u767e\u6155\u5927\u4e09\u89d2]<\/p>\n<p>\u89c2\u5bdf1\uff1a\u636e\u62a5\u9053\uff0c\u8fd9\u662f\u4e00\u4e9b\u95f9\u9b3c\u7684\u5730\u70b9\uff1a&#8230;<\/p>\n<p>\u884c\u52a82\uff1a\u7ed3\u675f[\u9a73\u65a5]<\/p>\n<p>\u89c2\u5bdf2\uff1a\u60c5\u8282\u7ed3\u675f<\/p>\n<p><strong>CoT\uff08\u601d\u8003\u8fc7\u7a0b\uff09<\/strong><\/p>\n<p>\u58f0\u660e\uff1a\u767e\u6155\u5927\u4e09\u89d2\u662f\u592a\u5e73\u6d0b\u4e0a\u4e00\u4e2a\u5b9a\u4e49\u4e0d\u4e25\u683c\u7684\u533a\u57df\u3002<\/p>\n<p>\u601d\u8003\uff1a\u8ba9\u6211\u4eec\u4e00\u6b65\u4e00\u6b65\u6765\u601d\u8003\u3002\u767e\u6155\u5927\u4e09\u89d2\u662f\u5927\u897f\u6d0b\u4e0a\u4e00\u4e2a\u5b9a\u4e49\u4e0d\u4e25\u683c\u7684\u533a\u57df\u3002\u592a\u5e73\u6d0b\u4e0d\u662f\u5927\u897f\u6d0b\u3002<\/p>\n<p>\u7b54\u6848\uff1
a\u9a73\u65a5<\/p>\n<p>\u901a\u8fc7\u8fd9\u4e2a\u903b\u8f91\u63a8\u7406\u8fc7\u7a0b\uff0c\u6211\u4eec\u53ef\u4ee5\u5f97\u51fa\u7ed3\u8bba\uff0c\u767e\u6155\u5927\u4e09\u89d2\u5b9e\u9645\u4e0a\u4f4d\u4e8e\u5927\u897f\u6d0b\uff0c\u800c\u4e0d\u662f\u592a\u5e73\u6d0b\u3002\u8fd9\u4e2a\u7ed3\u8bba\u662f\u57fa\u4e8e\u5bf9\u767e\u6155\u5927\u4e09\u89d2\u5730\u7406\u4f4d\u7f6e\u7684\u4e86\u89e3\u548c\u786e\u8ba4\u3002\u767e\u6155\u5927\u4e09\u89d2\u56e0\u5176\u795e\u79d8\u7684\u5931\u8e2a\u4e8b\u4ef6\u548c\u4f20\u8bf4\u800c\u95fb\u540d\uff0c\u4f46\u5730\u7406\u4f4d\u7f6e\u7684\u51c6\u786e\u6027\u540c\u6837\u91cd\u8981\uff0c\u4ee5\u907f\u514d\u8bef\u5bfc\u548c\u6df7\u6dc6\u3002<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<p><strong>\u793a\u4f8b 5908\uff08\u6807\u51c6\u7b54\u6848\uff1a\u652f\u6301\uff09<\/strong><\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\nClaim: Princess Mononoke is a film.<br \/>\nThought 1: I need to search Princess Mononoke and find if it is a film.<br \/>\nAction 1: Search[Princess Mononoke]<br \/>\nObservation 1: Princess Mononoke &#8230;<br \/>\nThought 2: From the observation, it says that Princess Mononoke is a film.<br \/>\nAction 2: Finish[SUPPORTS]<br \/>\nObservation 2: Episode finished<br \/>\n<strong>Act<\/strong><br \/>\nClaim: Princess Mononoke is a film.<br \/>\nAction 1: Search[Princess Mononoke]<br \/>\nObservation 1: Princess Mononoke &#8230;<br \/>\nAction 2: Finish[SUPPORTS]<br \/>\nObservation 2: Episode finished<br \/>\n<strong>CoT<\/strong><br \/>\nClaim: Princess Mononoke is a film.<br \/>\nThought: Let\u2019s think step by step. 
Princess Mononoke is a movie, and movies are<br \/>\nfilms.<br \/>\nAnswer: SUPPORTS<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\n\u58f0\u660e\uff1a\u300a\u5e7d\u7075\u516c\u4e3b\u300b\u662f\u4e00\u90e8\u7535\u5f71\u3002<br \/>\n\u60f3\u6cd51\uff1a\u6211\u9700\u8981\u641c\u7d22\u300a\u5e7d\u7075\u516c\u4e3b\u300b\uff0c\u770b\u5b83\u662f\u5426\u662f\u4e00\u90e8\u7535\u5f71\u3002<br \/>\n\u52a8\u4f5c1\uff1a\u641c\u7d22[\u5e7d\u7075\u516c\u4e3b]<br \/>\n\u89c2\u5bdf1\uff1a\u300a\u5e7d\u7075\u516c\u4e3b\u300b&#8230;<br \/>\n\u60f3\u6cd52\uff1a\u4ece\u89c2\u5bdf\u4e2d\u5f97\u77e5\uff0c\u300a\u5e7d\u7075\u516c\u4e3b\u300b\u662f\u4e00\u90e8\u7535\u5f71\u3002<br \/>\n\u52a8\u4f5c2\uff1a\u5b8c\u6210[\u652f\u6301]<br \/>\n\u89c2\u5bdf2\uff1a\u56de\u5408\u7ed3\u675f<br \/>\n<strong>Act<\/strong><br \/>\n\u58f0\u660e\uff1a\u300a\u5e7d\u7075\u516c\u4e3b\u300b\u662f\u4e00\u90e8\u7535\u5f71\u3002<br \/>\n\u52a8\u4f5c1\uff1a\u641c\u7d22[\u5e7d\u7075\u516c\u4e3b]<br \/>\n\u89c2\u5bdf1\uff1a\u300a\u5e7d\u7075\u516c\u4e3b\u300b&#8230;<br \/>\n\u52a8\u4f5c2\uff1a\u5b8c\u6210[\u652f\u6301]<br \/>\n\u89c2\u5bdf2\uff1a\u56de\u5408\u7ed3\u675f<br \/>\n<strong>CoT<\/strong><br \/>\n\u58f0\u660e\uff1a\u300a\u5e7d\u7075\u516c\u4e3b\u300b\u662f\u4e00\u90e8\u7535\u5f71\u3002<br \/>\n\u60f3\u6cd5\uff1a\u8ba9\u6211\u4eec\u4e00\u6b65\u4e00\u6b65\u601d\u8003\u3002\u300a\u5e7d\u7075\u516c\u4e3b\u300b\u662f\u4e00\u90e8\u5f71\u7247\uff0c\u800c\u5f71\u7247\u5c31\u662f\u7535\u5f71\u3002<br \/>\n\u7b54\u6848\uff1a\u652f\u6301<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<p><strong>\u793a\u4f8b 1951\uff08\u6807\u51c6\u7b54\u6848\uff1a\u53cd\u9a73\uff09<\/strong><\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\nClaim: Soyuz was part of the American space program.<br \/>\nThought 1: I need to search Soyuz and find if it was part of the American space<br \/>\nprogram.<br \/>\nAction 1: 
Search[Soyuz]<br \/>\nObservation 1: Soyuz is a transliteration&#8230;<br \/>\nThought 2: It does not mention the American space program, so I need to search<br \/>\n&#8220;American space program&#8221; to find if it was part of it.<br \/>\nAction 2: Search[American space program]<br \/>\nObservation 2: The space policy&#8230;<br \/>\nThought 3: It does not mention Soyuz, so I am not sure if this claim is true or not.<br \/>\nAction 3: Finish[NOT ENOUGH INFO]<br \/>\nObservation 3: Episode finished<br \/>\n<strong>Act<\/strong><br \/>\nClaim: Soyuz was part of the American space program.<br \/>\nAction 1: Search[Soyuz]<br \/>\nObservation 1: Soyuz is a transliteration&#8230;<br \/>\nAction 2: Finish[NOT ENOUGH INFO]<br \/>\nObservation 2: Episode finished<br \/>\n<strong>CoT<\/strong><br \/>\nClaim: Soyuz was part of the American space program.<br \/>\nThought: Let\u2019s think step by step. Soyuz is a Russian spacecraft. The American<br \/>\nspace program is NASA. NASA and Russia have worked together on the<br \/>\nInternational Space Station.<br \/>\nAnswer: SUPPORTS<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\n\u58f0\u660e\uff1a\u8054\u76df\u53f7\u662f\u7f8e\u56fd\u592a\u7a7a\u8ba1\u5212\u7684\u4e00\u90e8\u5206\u3002<br \/>\n\u601d\u80031\uff1a\u6211\u9700\u8981\u641c\u7d22\u8054\u76df\u53f7\uff0c\u627e\u5230\u5b83\u662f\u5426\u662f\u7f8e\u56fd\u592a\u7a7a\u8ba1\u5212\u7684\u4e00\u90e8\u5206\u3002<br \/>\n\u884c\u52a81\uff1a\u641c\u7d22[\u8054\u76df\u53f7]<br \/>\n\u89c2\u5bdf1\uff1a\u8054\u76df\u53f7\u662f\u4e00\u4e2a\u97f3\u8bd1\u8bcd&#8230;<br \/>\n\u601d\u80032\uff1a\u6ca1\u6709\u63d0\u5230\u7f8e\u56fd\u7684\u592a\u7a7a\u8ba1\u5212\uff0c\u6240\u4ee5\u6211\u9700\u8981\u641c\u7d22\u201c\u7f8e\u56fd\u592a\u7a7a\u8ba1\u5212\u201d\u6765\u627e\u5230\u5b83\u662f\u5426\u662f\u5176\u4e2d\u7684\u4e00\u90e8\u5206\u3002<br 
\/>\n\u884c\u52a82\uff1a\u641c\u7d22[\u7f8e\u56fd\u592a\u7a7a\u8ba1\u5212]<br \/>\n\u89c2\u5bdf2\uff1a\u592a\u7a7a\u653f\u7b56&#8230;<br \/>\n\u601d\u80033\uff1a\u6ca1\u6709\u63d0\u5230\u8054\u76df\u53f7\uff0c\u6240\u4ee5\u6211\u4e0d\u786e\u5b9a\u8fd9\u4e2a\u58f0\u660e\u662f\u771f\u662f\u5047\u3002<br \/>\n\u884c\u52a83\uff1a\u7ed3\u675f[\u4fe1\u606f\u4e0d\u8db3]<br \/>\n\u89c2\u5bdf3\uff1a\u7ed3\u675f<br \/>\n<strong>Act<\/strong><br \/>\n\u58f0\u660e\uff1a\u8054\u76df\u53f7\u662f\u7f8e\u56fd\u592a\u7a7a\u8ba1\u5212\u7684\u4e00\u90e8\u5206\u3002<br \/>\n\u884c\u52a81\uff1a\u641c\u7d22[\u8054\u76df\u53f7]<br \/>\n\u89c2\u5bdf1\uff1a\u8054\u76df\u53f7\u662f\u4e00\u4e2a\u97f3\u8bd1\u8bcd&#8230;<br \/>\n\u884c\u52a82\uff1a\u7ed3\u675f[\u4fe1\u606f\u4e0d\u8db3]<br \/>\n\u89c2\u5bdf2\uff1a\u7ed3\u675f<br \/>\n<strong>CoT<\/strong><br \/>\n\u58f0\u660e\uff1a\u8054\u76df\u53f7\u662f\u7f8e\u56fd\u592a\u7a7a\u8ba1\u5212\u7684\u4e00\u90e8\u5206\u3002<br \/>\n\u601d\u8003\uff1a\u8ba9\u6211\u4eec\u4e00\u6b65\u4e00\u6b65\u6765\u601d\u8003\u3002\u8054\u76df\u53f7\u662f\u4fc4\u7f57\u65af\u7684\u5b87\u5b99\u98de\u8239\u3002\u7f8e\u56fd\u7684\u592a\u7a7a\u8ba1\u5212\u662fNASA\u3002NASA\u548c\u4fc4\u7f57\u65af\u5728\u56fd\u9645\u7a7a\u95f4\u7ad9\u4e0a\u6709\u5408\u4f5c\u3002<br \/>\n\u7b54\u6848\uff1a\u652f\u6301<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<p><strong>\u793a\u4f8b 3208\uff08\u6807\u51c6\u7b54\u6848\uff1a\u53cd\u9a73\uff09<\/strong><\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\nClaim: Reign Over Me is an American film made in 2010.<br \/>\nThought 1: I need to search for Reign Over Me and find if it is an American film made<br \/>\nin 2010.<br \/>\nAction 1: Search[Reign Over Me]<br \/>\nObservation 1: Reign Over Me &#8230;<br \/>\nThought 2: The observation says that it is an American film made in 2007, so it is not<br \/>\nmade in 2010.<br \/>\nAction 2: Finish[REFUTES]<br \/>\nObservation 2: Episode finished<br \/>\n<strong>Act<\/strong><br \/>\nClaim: Reign Over Me 
is an American film made in 2010.<br \/>\nAction 1: Search[Reign Over Me]<br \/>\nAction 2: Finish[SUPPORTS]<br \/>\nObservation 2: Episode finished<br \/>\n<strong>CoT<\/strong><br \/>\nClaim: Reign Over Me is an American film made in 2010.<br \/>\nThought: Let\u2019s think step by step. First, is Reign Over Me an American film? Yes,<br \/>\nit is. Second, was it made in 2010? Yes, it was.<br \/>\nAnswer: SUPPORTS<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\n\u58f0\u660e\uff1a\u300aReign Over Me\u300b\u662f\u4e00\u90e82010\u5e74\u5236\u4f5c\u7684\u7f8e\u56fd\u7535\u5f71\u3002<br \/>\n\u60f3\u6cd51\uff1a\u6211\u9700\u8981\u641c\u7d22\u300aReign Over Me\u300b\uff0c\u786e\u8ba4\u5b83\u662f\u5426\u4e3a2010\u5e74\u5236\u4f5c\u7684\u7f8e\u56fd\u7535\u5f71\u3002<br \/>\n\u884c\u52a81\uff1a\u641c\u7d22[Reign Over Me]<br \/>\n\u89c2\u5bdf1\uff1a\u300aReign Over Me\u300b&#8230;<br \/>\n\u60f3\u6cd52\uff1a\u89c2\u5bdf\u7ed3\u679c\u663e\u793a\u5b83\u662f2007\u5e74\u5236\u4f5c\u7684\u7f8e\u56fd\u7535\u5f71\uff0c\u6240\u4ee5\u5b83\u4e0d\u662f2010\u5e74\u5236\u4f5c\u7684\u3002<br \/>\n\u884c\u52a82\uff1a\u7ed3\u675f[\u9a73\u65a5]<br \/>\n\u89c2\u5bdf2\uff1a\u7ed3\u675f<br \/>\n<strong>Act<\/strong><br \/>\n\u58f0\u660e\uff1a\u300aReign Over Me\u300b\u662f\u4e00\u90e82010\u5e74\u5236\u4f5c\u7684\u7f8e\u56fd\u7535\u5f71\u3002<br \/>\n\u884c\u52a81\uff1a\u641c\u7d22[Reign Over Me]<br \/>\n\u884c\u52a82\uff1a\u7ed3\u675f[\u652f\u6301]<br \/>\n\u89c2\u5bdf2\uff1a\u7ed3\u675f<br \/>\n<strong>CoT<\/strong><br \/>\n\u58f0\u660e\uff1a\u300aReign Over Me\u300b\u662f\u4e00\u90e82010\u5e74\u5236\u4f5c\u7684\u7f8e\u56fd\u7535\u5f71\u3002<br \/>\n\u60f3\u6cd5\uff1a\u8ba9\u6211\u4eec\u4e00\u6b65\u4e00\u6b65\u6765\u3002\u9996\u5148\uff0c\u300aReign Over Me\u300b\u662f\u90e8\u7f8e\u56fd\u7535\u5f71\u5417\uff1f\u662f\u7684\uff0c\u5b83\u662f\u3002\u5176\u6b21\uff0c\u5b83\u662f2010\u5e74\u5236\u4f5c\u7684\u5417\uff1f\u662f\u7684\uff0c\u5b83\u662f\u3002<br 
\/>\n\u56de\u7b54\uff1a\u652f\u6301<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<h3>D.2 ALFWORLD \u8f68\u8ff9<\/h3>\n<p>\u6211\u4eec\u63d0\u4f9b\u4e86ReAct\u3001Act\u548cReAct-IM\u5728\u540c\u4e00ALFWorld\u6e38\u620f\u4e2d\u7684\u793a\u4f8b\u8f68\u8ff9\uff0cpick_clean_then_place_in_recep-Knife-None-CounterTop-10\/ trial_T20190909_110445_675754\u3002<\/p>\n<p>&nbsp;<\/p>\n<h4><strong>D.2.1 REACT \u8f68\u8ff9<\/strong><\/h4>\n<p>ReAct\u80fd\u591f\u6b63\u786e\u627e\u5230\u5200\u3001\u6e05\u6d01\u5b83\uff0c\u7136\u540e\u5c06\u5176\u653e\u5728\u53f0\u9762\u4e0a\u3002<\/p>\n<p>&nbsp;<\/p>\n<p><strong>ReAct ALFWorld trajectory<\/strong><\/p>\n<blockquote><p>You are in the middle of a room. Looking quickly around you, you see a cabinet 6, a<br \/>\ncabinet 5, a cabinet 4, a cabinet 3, a cabinet 2, a cabinet 1, a coffeemachine 1, a<br \/>\ncountertop 3, a countertop 2, a countertop 1, a drawer 3, a drawer 2, a drawer 1, a<br \/>\nfridge 1, a garbagecan 1, a microwave 1, a shelf 3, a shelf 2, a shelf 1, a sinkbasin<br \/>\n1, a stoveburner 4, a stoveburner 3, a stoveburner 2, a stoveburner 1, and a toaster<br \/>\n1.<br \/>\nYour task is to: put a clean knife in countertop.<br \/>\n&gt; think: To solve the task, I need to find and take a knife, then clean it with<br \/>\nsinkbasin, then put it in countertop.<br \/>\nOK.<br \/>\n&gt; think: First I need to find a knife. A knife is more likely to appear in cabinet<br \/>\n(1-6), drawer (1-3), countertop (1-3), fridge (1), garbagecan (1), shelf (1-3),<br \/>\nsinkbasin (1), stoveburner (1-4), toaster (1). 
I can check one by one, starting with<br \/>\ncabinet 1.<br \/>\nOK.<br \/>\n&gt; go to cabinet 1<br \/>\nOn the cabinet 1, you see a bowl 1.<br \/>\n&gt; go to cabinet 2<br \/>\nThe cabinet 2 is closed.<br \/>\n&gt; go to cabinet 3<br \/>\nOn the cabinet 3, you see a glassbottle 1.<br \/>\n&gt; go to cabinet 4<br \/>\nOn the cabinet 4, you see a mug 1.<br \/>\n&gt; go to cabinet 5<br \/>\nThe cabinet 5 is closed.<br \/>\n&gt; go to cabinet 6<br \/>\nThe cabinet 6 is closed.<br \/>\n&gt; go to drawer 1<br \/>\nThe drawer 1 is closed.<br \/>\n&gt; go to drawer 2<br \/>\nThe drawer 2 is closed.<br \/>\n&gt; go to drawer 3<br \/>\nThe drawer 3 is closed.<br \/>\n&gt; go to countertop 1<br \/>\nOn the countertop 1, you see a lettuce 2, a mug 2, a peppershaker 1, and a spoon 2.<br \/>\n&gt; go to countertop 2<br \/>\nOn the countertop 2, you see a cup 1, a dishsponge 1, a glassbottle 3, a knife 1, a<br \/>\nplate 2, a potato 3, and a statue 1.<br \/>\n&gt; think: Now I find a knife (1). Next, I need to take it.<br \/>\nOK.<br \/>\n&gt; take knife 1 from countertop 2<br \/>\nYou pick up the knife 1 from the countertop 2.<br \/>\n&gt; think: Now I take a knife (1). Next, I need to go to sinkbasin (1) and clean it.<br \/>\nOK.<br \/>\n&gt; go to sinkbasin 1<br \/>\nOn the sinkbasin 1, you see a fork 3, a lettuce 3, and a spatula 2.<br \/>\n&gt; clean knife 1 with sinkbasin 1<br \/>\nYou clean the knife 1 using the sinkbasin 1.<br \/>\n&gt; think: Now I clean a knife (1). 
Next, I need to put it in\/on countertop 1.<br \/>\nOK.<br \/>\n&gt; go to countertop 1<br \/>\nOn the countertop 1, you see a lettuce 2, a mug 2, a peppershaker 1, and a spoon 2.<br \/>\n&gt; put knife 1 in\/on countertop 1<br \/>\nYou put the knife 1 in\/on the countertop 1.<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<blockquote><p>\u4f60\u4f4d\u4e8e\u623f\u95f4\u4e2d\u592e\u3002\u5feb\u901f\u73af\u987e\u56db\u5468\uff0c\u4f60\u770b\u5230\u4e00\u4e2a\u6a71\u67dc6\uff0c\u4e00\u4e2a\u6a71\u67dc5\uff0c\u4e00\u4e2a\u6a71\u67dc4\uff0c\u4e00\u4e2a\u6a71\u67dc3\uff0c\u4e00\u4e2a\u6a71\u67dc2\uff0c\u4e00\u4e2a\u6a71\u67dc1\uff0c\u4e00\u4e2a\u5496\u5561\u673a1\uff0c\u4e00\u4e2a\u684c\u97623\uff0c\u4e00\u4e2a\u684c\u97622\uff0c\u4e00\u4e2a\u684c\u97621\uff0c\u4e00\u4e2a\u62bd\u5c493\uff0c\u4e00\u4e2a\u62bd\u5c492\uff0c\u4e00\u4e2a\u62bd\u5c491\uff0c\u4e00\u4e2a\u51b0\u7bb11\uff0c\u4e00\u4e2a\u5783\u573e\u68761\uff0c\u4e00\u4e2a\u5fae\u6ce2\u70891\uff0c\u4e00\u4e2a\u67b6\u5b503\uff0c\u4e00\u4e2a\u67b6\u5b502\uff0c\u4e00\u4e2a\u67b6\u5b501\uff0c\u4e00\u4e2a\u6c34\u69fd1\uff0c\u4e00\u4e2a\u7076\u76d84\uff0c\u4e00\u4e2a\u7076\u76d83\uff0c\u4e00\u4e2a\u7076\u76d82\uff0c\u4e00\u4e2a\u7076\u76d81\uff0c\u548c\u4e00\u4e2a\u70e4\u9762\u5305\u673a1\u3002<br \/>\n\u4f60\u7684\u4efb\u52a1\u662f\uff1a\u628a\u4e00\u628a\u5e72\u51c0\u7684\u5200\u653e\u5728\u684c\u9762\u4e0a\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u4e3a\u4e86\u5b8c\u6210\u4efb\u52a1\uff0c\u6211\u9700\u8981\u627e\u5230\u5e76\u62ff\u8d77\u4e00\u628a\u5200\uff0c\u7136\u540e\u7528\u6c34\u69fd\u6e05\u6d17\u5b83\uff0c\u7136\u540e\u653e\u5728\u684c\u9762\u4e0a\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; 
\u601d\u8003\uff1a\u9996\u5148\u6211\u9700\u8981\u627e\u5230\u4e00\u628a\u5200\u3002\u4e00\u628a\u5200\u66f4\u6709\u53ef\u80fd\u51fa\u73b0\u5728\u6a71\u67dc\uff081-6\uff09\uff0c\u62bd\u5c49\uff081-3\uff09\uff0c\u684c\u9762\uff081-3\uff09\uff0c\u51b0\u7bb1\uff081\uff09\uff0c\u5783\u573e\u6876\uff081\uff09\uff0c\u67b6\u5b50\uff081-3\uff09\uff0c\u6c34\u69fd\uff081\uff09\uff0c\u7076\u76d8\uff081-4\uff09\uff0c\u70e4\u9762\u5305\u673a\uff081\uff09\u3002\u6211\u53ef\u4ee5\u4e00\u4e2a\u4e00\u4e2a\u5730\u68c0\u67e5\uff0c\u4ece\u6a71\u67dc1\u5f00\u59cb\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u524d\u5f80\u6a71\u67dc1<br \/>\n\u5728\u6a71\u67dc1\u4e0a\uff0c\u4f60\u770b\u5230\u4e00\u4e2a\u78971\u3002<br \/>\n&gt; \u524d\u5f80\u6a71\u67dc2<br \/>\n\u6a71\u67dc2\u662f\u5173\u95ed\u7684\u3002<br \/>\n&gt; \u524d\u5f80\u6a71\u67dc3<br \/>\n\u5728\u6a71\u67dc3\u4e0a\uff0c\u4f60\u770b\u5230\u4e00\u4e2a\u73bb\u7483\u74f61\u3002<br \/>\n&gt; \u524d\u5f80\u6a71\u67dc4<br \/>\n\u5728\u6a71\u67dc4\u4e0a\uff0c\u4f60\u770b\u5230\u4e00\u4e2a\u676f\u5b501\u3002<br \/>\n&gt; \u524d\u5f80\u6a71\u67dc5<br \/>\n\u6a71\u67dc5\u662f\u5173\u95ed\u7684\u3002<br \/>\n&gt; \u524d\u5f80\u6a71\u67dc6<br \/>\n\u6a71\u67dc6\u662f\u5173\u95ed\u7684\u3002<br \/>\n&gt; \u524d\u5f80\u62bd\u5c491<br \/>\n\u62bd\u5c491\u662f\u5173\u95ed\u7684\u3002<br \/>\n&gt; \u524d\u5f80\u62bd\u5c492<br \/>\n\u62bd\u5c492\u662f\u5173\u95ed\u7684\u3002<br \/>\n&gt; \u524d\u5f80\u62bd\u5c493<br \/>\n\u62bd\u5c493\u662f\u5173\u95ed\u7684\u3002<br \/>\n&gt; \u524d\u5f80\u684c\u97621<br \/>\n\u5728\u684c\u97621\u4e0a\uff0c\u4f60\u770b\u5230\u4e00\u5934\u751f\u83dc2\uff0c\u4e00\u4e2a\u676f\u5b502\uff0c\u4e00\u4e2a\u9ed1\u80e1\u6912\u76d0\u7f501\uff0c\u548c\u4e00\u628a\u53192\u3002<br \/>\n&gt; \u524d\u5f80\u684c\u97622<br 
\/>\n\u5728\u684c\u97622\u4e0a\uff0c\u4f60\u770b\u5230\u4e00\u4e2a\u676f\u5b501\uff0c\u4e00\u4e2a\u5237\u76d8\u7ef51\uff0c\u4e00\u4e2a\u73bb\u7483\u74f63\uff0c\u4e00\u628a\u52001\uff0c\u4e00\u4e2a\u76d8\u5b502\uff0c\u4e00\u4e2a\u571f\u8c463\uff0c\u548c\u4e00\u4e2a\u96d5\u50cf1\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u73b0\u5728\u6211\u627e\u5230\u4e00\u628a\u5200\uff081\uff09\u3002\u63a5\u4e0b\u6765\uff0c\u6211\u9700\u8981\u62ff\u5b83\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u4ece\u684c\u97622\u4e0a\u62ff\u8d77\u52001<br \/>\n\u4f60\u4ece\u684c\u97622\u4e0a\u62ff\u8d77\u52001\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u73b0\u5728\u6211\u62ff\u8d77\u4e00\u628a\u5200\uff081\uff09\u3002\u63a5\u4e0b\u6765\uff0c\u6211\u9700\u8981\u53bb\u6c34\u69fd\uff081\uff09\u6e05\u6d17\u5b83\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u524d\u5f80\u6c34\u69fd1<br \/>\n\u5728\u6c34\u69fd1\u4e0a\uff0c\u4f60\u770b\u5230\u4e00\u4e2a\u53c9\u5b503\uff0c\u4e00\u5934\u751f\u83dc3\uff0c\u548c\u4e00\u4e2a\u7ffb\u9505\u94f22\u3002<br \/>\n&gt; \u7528\u6c34\u69fd1\u6e05\u6d17\u52001<br \/>\n\u4f60\u7528\u6c34\u69fd1\u6e05\u6d17\u52001\u3002<br \/>\n&gt; \u601d\u8003\uff1a\u73b0\u5728\u6211\u6e05\u6d17\u4e86\u4e00\u628a\u5200\uff081\uff09\u3002\u63a5\u4e0b\u6765\uff0c\u6211\u9700\u8981\u628a\u5b83\u653e\u5728\/\u4e8e\u684c\u97621\u4e0a\u3002<br \/>\n\u597d\u7684\u3002<br \/>\n&gt; \u524d\u5f80\u684c\u97621<br \/>\n\u5728\u684c\u97621\u4e0a\uff0c\u4f60\u770b\u5230\u4e00\u5934\u751f\u83dc2\uff0c\u4e00\u4e2a\u676f\u5b502\uff0c\u4e00\u4e2a\u9ed1\u80e1\u6912\u76d0\u7f501\uff0c\u548c\u4e00\u628a\u53192\u3002<br \/>\n&gt; \u628a\u52001\u653e\u5728\/\u4e8e\u684c\u97621\u4e0a<br \/>\n\u4f60\u628a\u52001\u653e\u5728\/\u4e8e\u684c\u97621\u4e0a\u3002<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<h4><strong>D.2.2 ACT 
\u8f68\u8ff9<\/strong><\/h4>\n<p>Act\u80fd\u591f\u6b63\u786e\u627e\u5230\u5200\u5177\uff0c\u4f46\u5728\u5b9e\u9645\u524d\u5f80\u6c34\u69fd\u4e4b\u524d\uff0c\u5c1d\u8bd5\u4f7f\u7528\u6c34\u69fd\u6e05\u6d01\u5b83\u3002\u4ece\u90a3\u65f6\u8d77\uff0c\u6a21\u578b\u65e0\u6cd5\u6062\u590d\uff0c\u5e76\u9677\u5165\u91cd\u590d\u76f8\u540c\u7684\u547d\u4ee4\u5e8f\u5217\u3002\u5982\u679c\u4f7f\u7528ReAct\uff0c\u5df2\u6709\u7684\u60f3\u6cd5\u672c\u53ef\u4ee5\u5177\u4f53\u8bc6\u522b\u51fa\u5200\u5177\u5df2\u7ecf\u88ab\u62ff\u8d77\uff0c\u4e0b\u4e00\u4e2a\u5b50\u76ee\u6807\u662f\u524d\u5f80\u6c34\u69fd\u8fdb\u884c\u6e05\u6d01\u3002<\/p>\n<h4><strong>D.2.3 REACT-IM \u8f68\u8ff9<\/strong><\/h4>\n<p>ReAct-IM\u80fd\u591f\u6b63\u786e\u627e\u5230\u5200\u5177\uff0c\u4f46\u4e5f\u65e0\u6cd5\u6e05\u6d01\u5b83\u3002\u7136\u540eLLM\u5728\u5c1d\u8bd5\u5c06\u8fd9\u628a\u5200\u653e\u5728\u53f0\u9762\u4e0a\u65f6\u9677\u5165\u56f0\u5883\u3002\u4e00\u4e2a\u53ef\u80fd\u7684\u95ee\u9898\u662f\u9519\u8bef\u7684\u60f3\u6cd5\uff1athink: \u6211\u9700\u8981\u627e\u5230\u4e00\u628a\u5e72\u51c0\u7684\u5200\u3002\u8fd9\u4f3c\u4e4e\u8ba9LLM\u8bef\u4ee5\u4e3a\u5200\u5177\u5df2\u7ecf\u88ab\u6e05\u6d01\u8fc7\u4e86\u3002\u5728ReAct\u4e2d\uff0c\u8fd9\u4e00\u7cfb\u5217\u5b50\u76ee\u6807\u5c06\u901a\u8fc7\u6bcf\u4e2a\u60f3\u6cd5\u5177\u4f53\u6355\u6349\u3002<\/p>\n<p>&nbsp;<\/p>\n<h3>D.3 WEBSHOP \u8f68\u8ff9<\/h3>\n<p><strong>\u6307\u4ee4\uff1a<\/strong>\u7ed9\u6211\u4e70\u4e00\u5305\u5341\u516d\u5305\u88c5\u7684\u82f9\u679c\u8089\u6842\u5473\u51bb\u5e72\u9999\u8549\u7247\uff0c\u4ef7\u683c\u4f4e\u4e8e50.00\u7f8e\u5143<\/p>\n<p><img loading=\"lazy\" decoding=\"async\" class=\"aligncenter size-full wp-image-2536\" title=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-12\" src=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/a1794d053c604f0.png\" alt=\"ReAct: 
\u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-12\" width=\"706\" height=\"843\" srcset=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/a1794d053c604f0.png 706w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/a1794d053c604f0-251x300.png 251w\" sizes=\"auto, (max-width: 706px) 100vw, 706px\" \/><\/p>\n<p>\u886810\uff1a\u7531Act\u548cReAct\u9884\u6d4b\u7684Webshop\u793a\u4f8b\u8f68\u8ff9\u3002\u4e0eAct\u76f8\u6bd4\uff0cReAct\u4f7f\u7528\u63a8\u7406\u6765\u5bfb\u627e\u6ee1\u8db3\u6240\u6709\u76ee\u6807\u5c5e\u6027\u7684\u4ea7\u54c1\u3002<\/p>\n<p>&nbsp;<\/p>\n<p>&nbsp;<\/p>\n<h2>E \u66f4\u591a\u5206\u6790<\/h2>\n<p>&nbsp;<\/p>\n<h3>E.1 \u6210\u529f\u548c\u5931\u8d25\u6a21\u5f0f\u5206\u6790<\/h3>\n<p>\u6211\u4eec\u63d0\u4f9b\u4e86\u4e00\u4e9b\u5bf9\u5e94\u4e8e\u7b2c3.3\u8282\u4e2d\u7ed9\u51fa\u7684\u6210\u529f\u548c\u9519\u8bef\u6a21\u5f0f\u5206\u6790\u7684\u4f8b\u5b50\u3002\u4e3a\u4e86\u8282\u7701\u7a7a\u95f4\uff0c\u641c\u7d22\u7ed3\u679c\u548c\u975e\u4ee3\u8868\u6027\u6b65\u9aa4\u88ab\u7701\u7565\u3002<\/p>\n<p>&nbsp;<\/p>\n<p><strong>\u9884\u6d4b\u6b63\u786e\/Success: True positive<\/strong><\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\nQuestion: Author David Chanoff has collaborated with a U.S. Navy admiral who served as<br \/>\nthe ambassador to the United Kingdom under which President?<br \/>\nThought 1: I need to search David Chanoff and find the U.S. Navy admiral he<br \/>\ncollaborated with.<br \/>\nAction 1: Search[David Chanoff]<br \/>\nObservation 1: David Chanoff is a noted author&#8230;<br \/>\nAction 2: Search[William J. Crowe]<br \/>\nObservation 2: William J. Crowe is&#8230;<br \/>\nThought 3: William J. Crowe served as the ambassador to the United Kingdom under<br \/>\nPresident Bill Clinton. 
So the answer is Bill Clinton.<br \/>\nAction 3: Finish[Bill Clinton]<br \/>\nObservation 3: Episode finished<br \/>\n<strong>CoT<\/strong><br \/>\nQuestion: What was the name of the team that represented an Arizona university in<br \/>\nthe conference that covers a broad expanse of the western United States,<br \/>\nincluding Arizona, California, and New Mexico?<br \/>\nThought: Let\u2019s think step by step. The name of the team that represented an Arizona<br \/>\nuniversity in the conference that covers a broad expanse of the western<br \/>\nUnited States, including Arizona, California, and New Mexico is Arizona<br \/>\nState Sun Devils.<br \/>\nAnswer: Arizona State Sun Devils<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\n\u95ee\u9898\uff1a\u4f5c\u8005\u5927\u536b\u00b7\u67e5\u8bfa\u592b\u66fe\u4e0e\u4e00\u4f4d\u7f8e\u56fd\u6d77\u519b\u5c06\u519b\u5408\u4f5c\uff0c\u8fd9\u4f4d\u5c06\u519b\u5728\u54ea\u4f4d\u603b\u7edf\u7684\u4efb\u671f\u4e0b\u66fe\u62c5\u4efb\u82f1\u56fd\u5927\u4f7f\uff1f<br \/>\n\u601d\u80031\uff1a\u6211\u9700\u8981\u67e5\u627e\u5927\u536b\u00b7\u67e5\u8bfa\u592b\uff0c\u5e76\u627e\u51fa\u4ed6\u5408\u4f5c\u8fc7\u7684\u7f8e\u56fd\u6d77\u519b\u5c06\u519b\u3002<br \/>\n\u884c\u52a81\uff1a\u641c\u7d22[\u5927\u536b\u00b7\u67e5\u8bfa\u592b]<br \/>\n\u89c2\u5bdf1\uff1a\u5927\u536b\u00b7\u67e5\u8bfa\u592b\u662f\u4e00\u4f4d\u8457\u540d\u7684\u4f5c\u8005&#8230;<br \/>\n\u884c\u52a82\uff1a\u641c\u7d22[\u5a01\u5ec9\u00b7J\u00b7\u514b\u6d1b]<br \/>\n\u89c2\u5bdf2\uff1a\u5a01\u5ec9\u00b7J\u00b7\u514b\u6d1b\u662f&#8230;<br \/>\n\u601d\u80033\uff1a\u5a01\u5ec9\u00b7J\u00b7\u514b\u6d1b\u5728\u6bd4\u5c14\u00b7\u514b\u6797\u987f\u7684\u603b\u7edf\u4efb\u671f\u4e0b\u62c5\u4efb\u82f1\u56fd\u5927\u4f7f\u3002\u6240\u4ee5\u7b54\u6848\u662f\u6bd4\u5c14\u00b7\u514b\u6797\u987f\u3002<br \/>\n\u884c\u52a83\uff1a\u7ed3\u675f[\u6bd4\u5c14\u00b7\u514b\u6797\u987f]<br \/>\n\u89c2\u5bdf3\uff1a\u8fdb\u884c\u5b8c\u6bd5<br 
\/>\n<strong>CoT<\/strong><br \/>\n\u95ee\u9898\uff1a\u5728\u6db5\u76d6\u4e86\u4e9a\u5229\u6851\u90a3\u5dde\u3001\u52a0\u5229\u798f\u5c3c\u4e9a\u5dde\u548c\u65b0\u58a8\u897f\u54e5\u5dde\u7b49\u7f8e\u56fd\u897f\u90e8\u5e7f\u5927\u5730\u533a\u7684\u8054\u76df\u4e2d\uff0c\u54ea\u4e2a\u4ee3\u8868\u4e9a\u5229\u6851\u90a3\u67d0\u5927\u5b66\u7684\u56e2\u961f\u53c2\u52a0\uff1f<br \/>\n\u601d\u8003\uff1a\u6211\u4eec\u6765\u9010\u6b65\u5206\u6790\u3002\u5728\u6db5\u76d6\u4e86\u4e9a\u5229\u6851\u90a3\u5dde\u3001\u52a0\u5229\u798f\u5c3c\u4e9a\u5dde\u548c\u65b0\u58a8\u897f\u54e5\u5dde\u7b49\u7f8e\u56fd\u897f\u90e8\u5e7f\u5927\u5730\u533a\u7684\u8054\u76df\u4e2d\uff0c\u4ee3\u8868\u4e9a\u5229\u6851\u90a3\u67d0\u5927\u5b66\u53c2\u52a0\u7684\u56e2\u961f\u662f\u4e9a\u5229\u6851\u90a3\u5dde\u7acb\u5927\u5b66\u592a\u9633\u6076\u9b54\u961f\u3002<br \/>\n\u56de\u7b54\uff1a\u4e9a\u5229\u6851\u90a3\u5dde\u7acb\u5927\u5b66\u592a\u9633\u6076\u9b54\u961f<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<p><strong>\u6210\u529f\uff1a\u5047\u9633\u6027\/Success: False positive<\/strong><\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\nQuestion: Did the board game San Marco or About Time come out first?<br \/>\nThought 1: I need to search San Marco and About Time, and find which came out first.<br \/>\nAction 1: Search[San Marco]<br \/>\nObservation 1: San Marco is one of the &#8230; The was built in venice.<br \/>\nThought 2: San Marco is a sestiere of Venice. I need to search About Time next.<br \/>\nAction 2: Search[About Time]<br \/>\nObservation 2: Could not find [About Time]. Similar: [&#8230;].<br \/>\nThought 3: About Time is a 2013 film. So San Marco came out first.<br \/>\nAction 3: Finish[San Marco]<br \/>\nObservation 3: Episode finished<br \/>\n<strong>CoT<\/strong><br \/>\nQuestion: Was Vanderbilt University or Emory University founded first?<br \/>\nThought: Let\u2019s think step by step. Vanderbilt University was founded in 1873. Emory<br \/>\nUniversity was founded in 1836. 
1873 (Vanderbilt University) &gt; 1836 (Emory<br \/>\nUniversity), so Vanderbilt University was founded first.<br \/>\nAnswer: Emory University<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\n\u95ee\u9898\uff1a\u300a\u5723\u9a6c\u53ef\u300b\u6216\u300a\u5173\u4e8e\u65f6\u95f4\u300b\u8fd9\u4e24\u6b3e\u684c\u6e38\u54ea\u4e2a\u9996\u5148\u9762\u4e16\uff1f<br \/>\n\u601d\u80031\uff1a\u6211\u9700\u8981\u627e\u51fa\u300a\u5723\u9a6c\u53ef\u300b\u548c\u300a\u5173\u4e8e\u65f6\u95f4\u300b\u54ea\u6b3e\u6e38\u620f\u4f18\u5148\u53d1\u5e03\u3002<br \/>\n\u884c\u52a81\uff1a\u641c\u7d22[\u5723\u9a6c\u53ef]<br \/>\n\u89c2\u5bdf1\uff1a\u5723\u9a6c\u53ef\u662f&#8230; \u8fd9\u662f\u5728\u5a01\u5c3c\u65af\u5efa\u9020\u7684\u3002<br \/>\n\u601d\u80032\uff1a\u5723\u9a6c\u53ef\u662f\u5a01\u5c3c\u65af\u7684\u4e00\u4e2a\u533a\u3002\u63a5\u4e0b\u6765\u6211\u9700\u8981\u641c\u7d22\u300a\u5173\u4e8e\u65f6\u95f4\u300b\u3002<br \/>\n\u884c\u52a82\uff1a\u641c\u7d22[\u5173\u4e8e\u65f6\u95f4]<br \/>\n\u89c2\u5bdf2\uff1a\u672a\u80fd\u627e\u5230[\u5173\u4e8e\u65f6\u95f4]\u3002\u76f8\u4f3c\u7684\u6709\uff1a[\u2026]\u3002<br \/>\n\u601d\u80033\uff1a\u300a\u5173\u4e8e\u65f6\u95f4\u300b\u662f2013\u5e74\u4e0a\u6620\u7684\u4e00\u90e8\u7535\u5f71\uff0c\u56e0\u6b64\uff0c\u300a\u5723\u9a6c\u53ef\u300b\u5e94\u8be5\u662f\u9996\u6b3e\u53d1\u5e03\u7684\u3002<br \/>\n\u884c\u52a83\uff1a\u7ed3\u675f[\u5723\u9a6c\u53ef]<br \/>\n\u89c2\u5bdf3\uff1a\u4efb\u52a1\u7ed3\u675f<br \/>\n<strong>CoT<\/strong><br \/>\n\u95ee\u9898\uff1a\u8303\u5fb7\u5821\u5927\u5b66\u548c\u57c3\u9ed8\u91cc\u5927\u5b66\u54ea\u4e00\u6240\u9996\u5148\u5efa\u7acb\uff1f<br 
\/>\n\u601d\u8003\uff1a\u8ba9\u6211\u4eec\u4e00\u6b65\u4e00\u6b65\u6765\u601d\u8003\u3002\u8303\u5fb7\u5821\u5927\u5b66\u6210\u7acb\u4e8e1873\u5e74\u3002\u57c3\u9ed8\u91cc\u5927\u5b66\u6210\u7acb\u4e8e1836\u5e74\u30021873\uff08\u8303\u5fb7\u5821\u5927\u5b66\uff09&gt; 1836\uff08\u57c3\u9ed8\u91cc\u5927\u5b66\uff09\uff0c\u6240\u4ee5\u8303\u5fb7\u5821\u5927\u5b66\u5148\u6210\u7acb\u3002<br \/>\n\u7b54\u6848\uff1a\u57c3\u9ed8\u91cc\u5927\u5b66<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<p><strong>\u5931\u8d25\uff1a\u63a8\u7406\u9519\u8bef\/Failure: Reasoning error<\/strong><\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\nQuestion: What was the middle name of the actress who was cast alongside Harvey<br \/>\nFierstein, Linda Hart, Dick Latessa, Clarke Thorell, Mary Bond Davis, Laura<br \/>\nBell Bundy, Matthew Morrison, Corey Reynolds, and Marissa Jaret Winokur in<br \/>\nHairspray?<br \/>\nThought 1: I need to search Harvey Fierstein, Linda Hart, Dick Latessa, Clarke Thorell,<br \/>\nMary Bond Davis, Laura Bell Bundy, Matthew Morrison, Corey Reynolds, and<br \/>\nMarissa Jaret Winokur, find the actress that was cast alongside them in<br \/>\nHairspray, then find its middle name.<br \/>\nAction 1: Search[Harvey Fierstein]<br \/>\nObservation 1: Harvey Forbes Fierstein &#8230;<br \/>\nThought 2: Harvey Fierstein is an actor, playwright, and screenwriter. I need to<br \/>\nsearch Linda Hart next&#8230;<br \/>\nAction 2: Search[Linda Hart]&#8230;<br \/>\n<strong>CoT<\/strong><br \/>\nQuestion: Who is older Danny Green or James Worthy?<br \/>\nThought: Let\u2019s think step by step. Danny Green was born in 1987. James Worthy was<br \/>\nborn in 1961. 
1987 (Danny Green) &gt; 1961 (James Worthy), so Danny Green is<br \/>\nolder.<br \/>\nAnswer: Danny Green<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\n\u95ee\u9898\uff1a\u5728\u300a\u53d1\u80f6\u300b\u4e2d\uff0c\u548cHarvey Fierstein\u3001Linda Hart\u3001Dick Latessa\u3001Clarke Thorell\u3001Mary Bond Davis\u3001Laura Bell Bundy\u3001Matthew Morrison\u3001Corey Reynolds\u4ee5\u53caMarissa Jaret Winokur\u4e00\u8d77\u6f14\u51fa\u7684\u5973\u6f14\u5458\u4e2d\u95f4\u540d\u662f\u4ec0\u4e48\uff1f<br \/>\n\u60f3\u6cd51\uff1a\u6211\u9700\u8981\u67e5\u627eHarvey Fierstein\u3001Linda Hart\u3001Dick Latessa\u3001Clarke Thorell\u3001Mary Bond Davis\u3001Laura Bell Bundy\u3001Matthew Morrison\u3001Corey Reynolds\u548cMarissa Jaret Winokur\uff0c\u627e\u51fa\u548c\u4ed6\u4eec\u5728\u5267\u4e2d\u4e00\u8d77\u6f14\u51fa\u7684\u5973\u6f14\u5458\uff0c\u5e76\u627e\u5230\u5979\u7684\u4e2d\u95f4\u540d\u3002<br \/>\n\u52a8\u4f5c1\uff1a\u641c\u7d22[Harvey Fierstein]<br \/>\n\u89c2\u5bdf1\uff1aHarvey Forbes Fierstein&#8230;<br \/>\n\u60f3\u6cd52\uff1aHarvey Fierstein\u662f\u4e00\u4f4d\u6f14\u5458\u3001\u5267\u4f5c\u5bb6\u548c\u7f16\u5267\u3002\u63a5\u4e0b\u6765\u9700\u8981\u641c\u7d22Linda Hart&#8230;<br \/>\n\u52a8\u4f5c2\uff1a\u641c\u7d22[Linda Hart]&#8230;<\/p>\n<p><strong>CoT<\/strong><br \/>\n\u95ee\u9898\uff1aDanny Green\u548cJames Worthy\u8c01\u5e74\u9f84\u66f4\u5927\uff1f<br \/>\n\u601d\u8003\uff1a\u6211\u4eec\u5206\u6b65\u8fdb\u884c\u3002Danny Green\u51fa\u751f\u57281987\u5e74\uff0c\u800cJames Worthy\u51fa\u751f\u57281961\u5e74\u30021987\uff08Danny Green\uff09&gt; 1961\uff08James Worthy\uff09\uff0c\u56e0\u6b64\uff0cDanny Green\u66f4\u5e74\u957f\u3002<br \/>\n\u56de\u7b54\uff1aDanny Green<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<p><strong>\u5931\u8d25\uff1a\u641c\u7d22\u9519\u8bef\/Failure: Search error<\/strong><\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\nQuestion: What does the goddess associated with the goddess frigg consists of what<br 
\/>\ntales?<br \/>\nThought 1: I need to search goddess frigg and find its associated goddess.<br \/>\nAction 1: Search[goddess frigg]<br \/>\nObservation 1: Could not find goddess frigg. Similar: [\u2019Frigg\u2019, \u2019Frigg and Freyja common<br \/>\norigin hypothesis\u2019, \u2019Freyja (section Relation to Frigg and other goddesses<br \/>\nand figures)\u2019, \u2019Eir (redirect from Eir (goddess))\u2019, \u2019Baldr\u2019].<br \/>\nThought 2: I need to search Frigg instead&#8230;<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<blockquote><p><strong>ReAct<\/strong><\/p>\n<p>\u95ee\u9898\uff1a\u548c\u5973\u795eFrigg\u6709\u5173\u7684\u5973\u795e\u7531\u4ec0\u4e48\u6545\u4e8b\u6784\u6210\uff1f<br \/>\n\u60f3\u6cd51\uff1a\u6211\u9700\u8981\u641c\u7d22\u5973\u795eFrigg\u5e76\u627e\u51fa\u4e0e\u5979\u6709\u5173\u7684\u5973\u795e\u3002<br \/>\n\u52a8\u4f5c1\uff1a\u641c\u7d22[\u5973\u795eFrigg]<br \/>\n\u89c2\u5bdf1\uff1a\u65e0\u6cd5\u627e\u5230\u5973\u795eFrigg\u3002\u76f8\u4f3c\u7684\u6709\uff1a[&#8216;Frigg&#8217;\uff0c&#8217;Frigg\u548cFreyja\u5171\u540c\u8d77\u6e90\u7684\u5047\u8bf4&#8217;\uff0c&#8217;Freyja\uff08\u4e0eFrigg\u548c\u5176\u4ed6\u5973\u795e\u4ee5\u53ca\u4eba\u7269\u7684\u5173\u7cfb\uff09&#8217;\uff0c&#8217;Eir\uff08\u4eceEir\uff08\u5973\u795e\uff09\u91cd\u5b9a\u5411\uff09&#8217;\uff0c&#8217;Baldr&#8217;]\u3002<br \/>\n\u60f3\u6cd52\uff1a\u6211\u9700\u8981\u6362\u4e2a\u65b9\u5f0f\u641c\u7d22Frigg&#8230;<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<p><strong>\u5931\u8d25\uff1a\u5e7b\u89c9\/Failure: Hallucination<\/strong><\/p>\n<blockquote><p><strong>CoT<\/strong><br \/>\nQuestion: What was the first year a scientific journal published by an organization<br \/>\nlocated in the Bronx was published?<br \/>\nThought: Let\u2019s think step by step. 
The first year a scientific journal published by<br \/>\nan organization located in the Bronx was published was 1916.<br \/>\nAnswer: 1916 (Label: 1909)<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<blockquote><p><strong>CoT<\/strong><br \/>\n\u95ee\u9898\uff1a\u4f4d\u4e8e\u5e03\u6717\u514b\u65af\u7684\u673a\u6784\u9996\u6b21\u51fa\u7248\u79d1\u5b66\u671f\u520a\u7684\u5e74\u4efd\u662f\u54ea\u4e00\u5e74\u5462\uff1f<br \/>\n\u601d\u8003\uff1a\u6211\u4eec\u6309\u6b65\u5c31\u73ed\u5730\u601d\u8003\u3002\u9996\u6b21\u7531\u4f4d\u4e8e\u5e03\u6717\u514b\u65af\u7684\u673a\u6784\u51fa\u7248\u7684\u79d1\u5b66\u671f\u520a\u7684\u5e74\u4efd\u662f1916\u5e74\u3002<br \/>\n\u7b54\u6848\uff1a1916\u5e74\uff08\u6807\u7b7e\uff1a1909\u5e74\uff09<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<p><strong>\u5931\u8d25\uff1a\u6807\u7b7e\u6b67\u4e49\/Failure: Label ambiguity<\/strong><\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\nQuestion: What nationality is the man who developed the dictator game?<br \/>\nThought 1: I need to search dictator game, find the man who developed it, then find his<br \/>\nnationality.<br \/>\nAction 1: Search[dictator game]<br \/>\nObservation 1: The dictator game is a popular experimental instrument in social psychology<br \/>\nand economics&#8230;<br \/>\nAction 3: Search[Amos Tversky]<br \/>\nObservation 3: Amos Nathan Tversky&#8230;<br \/>\nThought 4: Amos Tversky is an Israeli cognitive and mathematical psychologist. So the<br \/>\nman who developed the dictator game is Israeli.<br \/>\nAction 4: Finish[Israeli] (label: Israel-American)<br \/>\n<strong>CoT<\/strong><br \/>\nQuestion: Kurt Fuller from Stockton, CA appeared in which American Detective Comedy<br \/>\nDrama television series created by Steve Franks?<br \/>\nThought: Let\u2019s think step by step. 
Kurt Fuller from Stockton, CA appeared in Psych.<br \/>\nPsych is an American Detective Comedy Drama television series created by<br \/>\nSteve Franks.<br \/>\nAnswer: Psych (label: Psych is an American detective comedy-drama)<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<blockquote><p><strong>ReAct<\/strong><br \/>\n\u95ee\u9898\uff1a\u53d1\u660e\u201c\u72ec\u88c1\u8005\u6e38\u620f\u201d\u7684\u90a3\u4e2a\u4eba\u662f\u54ea\u4e2a\u56fd\u5bb6\u7684\uff1f<br \/>\n\u601d\u80031\uff1a\u6211\u9700\u8981\u53bb\u641c\u7d22\u201c\u72ec\u88c1\u8005\u6e38\u620f\u201d\uff0c\u627e\u5230\u53d1\u660e\u5b83\u7684\u4eba\uff0c\u7136\u540e\u67e5\u51fa\u4ed6\u7684\u56fd\u7c4d\u3002<br \/>\n\u884c\u52a81\uff1a\u641c\u7d22[\u72ec\u88c1\u8005\u6e38\u620f]<br \/>\n\u89c2\u5bdf1\uff1a\u72ec\u88c1\u8005\u6e38\u620f\u662f\u4e00\u79cd\u5728\u793e\u4f1a\u5fc3\u7406\u5b66\u548c\u7ecf\u6d4e\u5b66\u4e2d\u5e38\u89c1\u7684\u5b9e\u9a8c\u5de5\u5177\u2026\u2026<br \/>\n\u884c\u52a83\uff1a\u641c\u7d22[Amos Tversky]<br \/>\n\u89c2\u5bdf3\uff1a\u963f\u83ab\u65af\u00b7\u5185\u68ee\u00b7\u7279\u5f17\u65af\u57fa\u2026\u2026<br \/>\n\u601d\u80034\uff1a\u963f\u83ab\u65af\u00b7\u7279\u5f17\u65af\u57fa\u662f\u4ee5\u8272\u5217\u7684\u8ba4\u77e5\u4e0e\u6570\u5b66\u5fc3\u7406\u5b66\u5bb6\u3002\u56e0\u6b64\uff0c\u53d1\u660e\u201c\u72ec\u88c1\u8005\u6e38\u620f\u201d\u7684\u4eba\u662f\u4ee5\u8272\u5217\u4eba\u3002<br \/>\n\u884c\u52a84\uff1a\u7ed3\u675f[\u4ee5\u8272\u5217\u4eba] (\u6807\u7b7e\u6ce8\u91ca\uff1a\u4ee5\u8272\u5217-\u7f8e\u56fd)<br \/>\n<strong>CoT<\/strong><br \/>\n\u95ee\u9898\uff1a\u53f2\u8482\u592b\u00b7\u5f17\u5170\u514b\u521b\u4f5c\u7684\u54ea\u90e8\u7f8e\u56fd\u4fa6\u63a2\u559c\u5267\u7cfb\u5217\u4e2d\u51fa\u73b0\u4e86\u6765\u81ea\u52a0\u5dde\u65af\u6258\u514b\u987f\u7684\u5e93\u7279\u00b7\u5bcc\u52d2\uff1f<br 
\/>\n\u601d\u8003\uff1a\u8ba9\u6211\u4eec\u9010\u6b65\u6765\u601d\u8003\u3002\u5e93\u7279\u00b7\u5bcc\u52d2\u5728\u300a\u5fc3\u7406\u300b\u4e2d\u51fa\u73b0\u8fc7\u3002\u300a\u5fc3\u7406\u300b\u662f\u7531\u53f2\u8482\u592b\u00b7\u5f17\u5170\u514b\u521b\u4f5c\u7684\u7f8e\u56fd\u4fa6\u63a2\u559c\u5267\u7535\u89c6\u5267\u7cfb\u5217\u3002<br \/>\n\u7b54\u6848\uff1a\u300a\u5fc3\u7406\u300b (\u6807\u7b7e\u6ce8\u91ca\uff1a\u300a\u5fc3\u7406\u300b\u662f\u7f8e\u56fd\u7684\u4e00\u90e8\u4fa6\u63a2\u559c\u5267)<\/p><\/blockquote>\n<p>&nbsp;<\/p>\n<p>&nbsp;<\/p>\n<div style=\"width: 3358px\" class=\"wp-caption aligncenter\"><img loading=\"lazy\" decoding=\"async\" class=\"aligncenter size-full wp-image-2538\" title=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-13\" src=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/6bb41fdad0dfcc2.png\" alt=\"ReAct: \u5927\u8bed\u8a00\u6a21\u578b\u4e2d\u63a8\u7406\u548c\u884c\u52a8\u534f\u540c\u5de5\u4f5c-13\" width=\"3348\" height=\"1990\" srcset=\"https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/6bb41fdad0dfcc2.png 3348w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/6bb41fdad0dfcc2-300x178.png 300w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/6bb41fdad0dfcc2-1024x609.png 1024w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/6bb41fdad0dfcc2-768x456.png 768w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/6bb41fdad0dfcc2-1536x913.png 1536w, https:\/\/www.kdjingpai.com\/wp-content\/uploads\/2024\/04\/6bb41fdad0dfcc2-2048x1217.png 2048w\" sizes=\"auto, (max-width: 3348px) 100vw, 3348px\" \/><p class=\"wp-caption-text\">\u975e\u8bba\u6587\u90e8\u5206\uff0c\u65b9\u4fbf\u7406\u89e3\uff0c\u7b80\u5355\u7684\u68b3\u7406\u903b\u8f91<\/p><\/div>\n","protected":false},"excerpt":{"rendered":"<p>\u539f\u6587\uff1ahttps:\/\/arxiv.org\/pdf\/2210.03629.pdf 
\u770b\u5b8c\u4e5f\u65e0\u6cd5\u7406\u89e3ReAct\u5982\u4f55\u8fd0\u4f5c\u548c\u5e94\u7528\uff1f\u8bf7\u770b\u300aReAct\u5b9e\u73b0\u903b\u8f91\u5b9e\u64cd\u300b\uff0c\u7528\u5b9e\u9645\u6848\u4f8b\u8fdb\u884c\u8bb2\u89e3\u3002 &nbsp; \u6458\u8981 &nbsp; \u867d\u7136\u5927\u578b\u8bed\u8a00\u6a21\u578b(llm)\u5728\u8bed\u8a00&#8230;<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"closed","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[34],"tags":[],"class_list":["post-1795","post","type-post","status-publish","format-standard","hentry","category-knowledge"],"_links":{"self":[{"href":"https:\/\/www.kdjingpai.com\/ja\/wp-json\/wp\/v2\/posts\/1795","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.kdjingpai.com\/ja\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.kdjingpai.com\/ja\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.kdjingpai.com\/ja\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/www.kdjingpai.com\/ja\/wp-json\/wp\/v2\/comments?post=1795"}],"version-history":[{"count":0,"href":"https:\/\/www.kdjingpai.com\/ja\/wp-json\/wp\/v2\/posts\/1795\/revisions"}],"wp:attachment":[{"href":"https:\/\/www.kdjingpai.com\/ja\/wp-json\/wp\/v2\/media?parent=1795"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.kdjingpai.com\/ja\/wp-json\/wp\/v2\/categories?post=1795"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.kdjingpai.com\/ja\/wp-json\/wp\/v2\/tags?post=1795"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}