{"id":63835,"date":"2025-08-25T17:16:10","date_gmt":"2025-08-25T09:16:10","guid":{"rendered":"https:\/\/swarma.org\/?p=63835"},"modified":"2025-08-25T17:16:10","modified_gmt":"2025-08-25T09:16:10","slug":"%e4%bb%8eq%e5%ad%a6%e4%b9%a0%e5%88%b0ai%e6%b8%b8%e6%88%8f%e5%a4%a7%e5%b8%88%ef%bc%9adqn%e5%a6%82%e4%bd%95%e7%a0%b4%e8%a7%a3%e5%a4%8d%e6%9d%82%e4%bb%bb%e5%8a%a1%ef%bc%9f%e4%b8%a8%e9%9b%86%e6%99%ba","status":"publish","type":"post","link":"https:\/\/swarma.org\/?p=63835","title":{"rendered":"\u4eceQ\u5b66\u4e60\u5230AI\u6e38\u620f\u5927\u5e08\uff1aDQN\u5982\u4f55\u7834\u89e3\u590d\u6742\u4efb\u52a1\uff1f\u4e28\u96c6\u667a\u767e\u79d1"},"content":{"rendered":"<div class='wxsyncmain'>\n<section style=\"margin-bottom: 0px;letter-spacing: 0.544px;font-family: PingFangSC-light;font-size: 15px\" data-mpa-powered-by=\"yiban.io\" data-pm-slice=\"0 0 []\">\n<section style=\"width: 661px;vertical-align: top\">\n<section style=\"margin-top: 10px;letter-spacing: 0.544px\">\n<section style=\"text-align: center\"><img class=\"rich_pages wxw-img\" data-ratio=\"0.5625\" data-s=\"300,640\" data-type=\"png\" data-w=\"1280\" style=\"width:100%\" data-croporisrc=\"https:\/\/mmbiz.qpic.cn\/mmbiz_png\/wibWV1DB7tWLH1ExCHsYrXK9pXoe0JJqj7EUYicwiaxZUtMmDIiaGglbvricMicN448bZNZSibp15qwle4iaLibSrpq7JGA\/0?wx_fmt=png&amp;from=appmsg\" data-cropselx2=\"578\" data-cropsely2=\"241\" data-backw=\"578\" data-backh=\"325\" data-imgfileid=\"100235447\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-152bbf550c2d9d628c4445742871c308.png\" \/><\/section>\n<section style=\"width: 661px\">\n<section style=\"padding-right: 3px;float: left;line-height: 1\">\n<section style=\"text-align: left\">\n<section style=\"padding-left: 10px;width: auto;vertical-align: top;min-width: 10%;height: auto;line-height: 0\">\n<section>\n<section style=\"width: 25px;height: 10px;vertical-align: top;overflow: hidden;line-height: 0;border-style: solid solid none;border-width: 3px 3px 2px;border-radius: 0px\"><span><br 
\/><\/span><\/section>\n<\/section>\n<section>\n<section style=\"text-align: justify;font-size: 16px;line-height: 1.5\">\n<p><strong><span>\u5bfc\u8bed<\/span><\/strong><\/p>\n<\/section>\n<\/section>\n<section>\n<section style=\"width: 24px;height: 10px;vertical-align: top;overflow: hidden;line-height: 0;border-style: solid solid none;border-width: 3px 3px 2px;border-radius: 0px\"><span><br \/><\/span><\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<section style=\"padding-right: 4px;padding-left: 4px;clear: right;min-height: 4.5em !important\">\n<section style=\"margin-top: 5px;margin-bottom: 5px\">\n<section style=\"padding-right: 8px;padding-left: 8px;font-size: 13px;line-height: 2;letter-spacing: 0.544px\" data-mpa-action-id=\"md85321l1f2\" data-pm-slice=\"0 0 []\">\n<p style=\"clear: none;line-height: 2em\"><strong style=\"letter-spacing: 0.544px;text-indent: 0em;font-size: 15px\"><span style=\"font-size: 13px;letter-spacing: 0.544px\"><span><span>\u6df1\u5ea6Q\u7f51\u7edc(Deep Q-Network, 
DQN)\u662f\u4e00\u79cd\u57fa\u4e8e\u6df1\u5ea6\u5b66\u4e60\u7684\u5f3a\u5316\u5b66\u4e60\u7b97\u6cd5\uff0c\u5b83\u901a\u8fc7\u6df1\u5ea6\u795e\u7ecf\u7f51\u7edc\u6765\u8fd1\u4f3c\u6700\u4f18\u52a8\u4f5c\u4ef7\u503c\u51fd\u6570\uff08Q\u51fd\u6570\uff09\uff0c\u80fd\u591f\u76f4\u63a5\u4ece\u9ad8\u7ef4\u611f\u77e5\u8f93\u5165\uff08\u5982\u6e38\u620f\u753b\u9762\u50cf\u7d20\uff09\u4e2d\u5b66\u4e60\u6700\u4f18\u51b3\u7b56\u7b56\u7565\u3002\u8be5\u7b97\u6cd5\u7684\u6838\u5fc3\u521b\u65b0\u5728\u4e8e\u7ed3\u5408\u4e86\u7ecf\u9a8c\u56de\u653e\u673a\u5236\u548c\u76ee\u6807\u7f51\u7edc\u6280\u672f\uff0c\u6709\u6548\u89e3\u51b3\u4e86\u4f20\u7edfQ\u5b66\u4e60\u5728\u975e\u7ebf\u6027\u51fd\u6570\u903c\u8fd1\u4e2d\u7684\u7a33\u5b9a\u6027\u95ee\u9898\uff0c\u9996\u6b21\u5728Atari\u6e38\u620f\u4e0a\u5b9e\u73b0\u4e86\u4ece\u539f\u59cb\u50cf\u7d20\u8f93\u5165\u5230\u63a7\u5236\u6307\u4ee4\u7684\u7aef\u5230\u7aef\u5b66\u4e60\uff0c\u8fbe\u5230\u4e86\u4eba\u7c7b\u6c34\u5e73\u7684\u6e38\u620f\u8868\u73b0\u3002<\/span><\/span><strong style=\"margin: 0px;padding: 0px;max-width: 100%;font-family: PingFangSC-light;font-style: normal;letter-spacing: 0.544px;text-align: justify;text-indent: 0em;text-transform: none;font-size: 15px\" data-pm-slice=\"0 0 []\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 13px;letter-spacing: 0.544px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><br \/><\/span><\/span><\/strong><\/span><\/strong><\/p>\n<p style=\"clear: none;line-height: 2em\"><strong style=\"letter-spacing: 0.544px;text-indent: 0em;font-size: 15px\"><span style=\"font-size: 13px;letter-spacing: 0.544px\"><span><br \/><\/span><\/span><\/strong><\/p>\n<p style=\"clear: none;line-height: 2em\"><strong style=\"text-indent: 0em;letter-spacing: 0.544px;font-size: 15px\"><span style=\"font-size: 13px;font-family: PingFangSC-light;text-indent: 0em;letter-spacing: 
0.578px\"><strong><span>\u201c\u96c6\u667a\u767e\u79d1\u7cbe\u9009\u201d\u662f\u4e00\u4e2a\u957f\u671f\u4e13\u680f\uff0c\u6301\u7eed\u4e3a\u5927\u5bb6\u63a8\u9001\u590d\u6742\u6027\u79d1\u5b66\u76f8\u5173\u7684\u57fa\u672c\u6982\u5ff5\u548c\u8d44\u6e90\u4fe1\u606f\u3002\u4f5c\u4e3a\u96c6\u667a\u4ff1\u4e50\u90e8\u7684\u5f00\u6e90\u79d1\u5b66\u9879\u76ee\uff0c\u96c6\u667a\u767e\u79d1\u5e0c\u671b\u6253\u9020\u590d\u6742\u6027\u79d1\u5b66\u9886\u57df\u6700\u5168\u9762\u7684\u767e\u79d1\u5168\u4e66\uff0c\u6b22\u8fce\u5bf9\u590d\u6742\u6027\u79d1\u5b66\u611f\u5174\u8da3\u3001\u70ed\u7231\u77e5\u8bc6\u6574\u7406\u548c\u5206\u4eab\u7684\u670b\u53cb\u52a0\u5165\uff0c\u6587\u672b\u53ef\u4ee5\u626b\u7801\u62a5\u540d\u52a0\u5165\u767e\u79d1\u5fd7\u613f\u8005\uff01<\/span><\/strong><\/span><\/strong><\/p>\n<p style=\"clear: none;line-height: 2em\"><strong style=\"text-indent: 0em;letter-spacing: 0.544px;font-size: 15px\"><span style=\"font-size: 13px;font-family: PingFangSC-light;text-indent: 0em;letter-spacing: 0.578px\"><strong><span><br \/><\/span><\/strong><\/span><\/strong><\/p>\n<section style=\"text-align: center;margin-bottom: 0px\"><img class=\"rich_pages wxw-img js_insertlocalimg\" data-ratio=\"1\" data-s=\"300,640\" data-type=\"png\" data-w=\"400\" style=\"width: 152px;height: 152px\" data-imgfileid=\"100234683\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-75dc718999d590d7b9d3a6f3cc7bb077-1.png\" \/><\/section>\n<p style=\"text-align: center\"><span>\u2191\u2191\u2191\u626b\u7801\u76f4\u8fbe\u767e\u79d1\u8bcd\u6761<\/span><\/p>\n<p style=\"clear: none;line-height: 2em\"><strong style=\"text-indent: 0em;letter-spacing: 0.544px;font-size: 15px\"><span style=\"font-size: 13px;font-family: PingFangSC-light;text-indent: 0em;letter-spacing: 0.578px\"><\/span><\/strong><\/p>\n<p><span><br \/><\/span><\/p>\n<\/section>\n<section style=\"padding-right: 8px;padding-left: 8px;font-size: 13px;line-height: 2;letter-spacing: 0.544px\"><span style=\"font-size: 
12px\"><strong style=\"letter-spacing: 0.544px\"><strong style=\"letter-spacing: 0.544px\"><strong style=\"letter-spacing: 0.544px\"><strong style=\"text-align: start\"><span>\u5173\u952e\u8bcd\uff1a<\/span><span>\u6df1\u5ea6\u5b66\u4e60\uff0cDeep Q Network\uff0c\u65e0\u6a21\u578b\uff08Model-free\uff09\u7b97\u6cd5\uff0c\u52a8\u4f5c\u4ef7\u503c\u51fd\u6570\uff0c\u7ecf\u9a8c\u56de\u653e\uff08Experience Replay\uff09<\/span><\/strong><\/strong><\/strong><\/strong><\/span><\/section>\n<section style=\"padding-right: 8px;padding-left: 8px;font-size: 13px;line-height: 2;letter-spacing: 0.544px\"><strong style=\"letter-spacing: 0.544px\"><strong style=\"letter-spacing: 0.544px\"><\/strong><\/strong><\/section>\n<section style=\"padding-right: 8px;padding-left: 8px;font-size: 13px;line-height: 2;letter-spacing: 0.544px\"><strong style=\"letter-spacing: 0.544px\"><strong style=\"letter-spacing: 0.544px\"><\/strong><\/strong><\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<section style=\"margin-top: 10px\">\n<section style=\"width: 661px\">\n<section style=\"clear: both;line-height: 0\">\n<section style=\"line-height: 0;width: 0px\"><\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<section style=\"margin-top: 10px;margin-bottom: 10px;letter-spacing: 0.544px;font-family: PingFangSC-light;font-size: 15px;text-align: center\">\n<section style=\"vertical-align: middle;line-height: 0\"><img class=\"rich_pages wxw-img\" data-ratio=\"0.07314814814814814\" data-type=\"png\" data-w=\"1080\" style=\"vertical-align: middle;width: 677px !important;height: auto !important\" data-fileid=\"100098753\" data-imgfileid=\"100222150\" src=\"\" \/><\/section>\n<\/section>\n<section style=\", Arial, sans-serif;letter-spacing: 0.544px;text-align: right\">\n<p><span style=\"font-family: PingFangSC-light;font-size: 13px;letter-spacing: 0.544px\"><span>\u90b9\u4f73\u73ae\u3001\u7f57\u798f\u6d77<\/span><span>&nbsp;<\/span><\/span><span style=\"font-family: 
PingFangSC-light;letter-spacing: 0.544px;font-size: 16px;font-weight: bold\"><\/span><span style=\"font-family: PingFangSC-light;letter-spacing: 0.544px;font-size: 13px;font-weight: bold\"><span>| \u7f16\u5199<\/span><\/span><\/p>\n<section style=\", Arial, sans-serif;letter-spacing: 0.544px;text-align: right\">\n<p data-pm-slice=\"3 3 [&quot;para&quot;,{&quot;tagName&quot;:&quot;section&quot;,&quot;attributes&quot;:{&quot;powered-by&quot;:&quot;xiumi.us&quot;,&quot;style&quot;:&quot;-webkit-tap-highlight-color: transparent;outline: 0px;font-family: &quot;PingFang SC&quot;, system-ui, -apple-system, &quot;system-ui&quot;, &quot;Helvetica Neue&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.544px;white-space: normal;background-color: rgb(255, 255, 255);visibility: visible;text-align: right;&quot;},&quot;namespaceURI&quot;:&quot;http:\/\/www.w3.org\/1999\/xhtml&quot;}]\"><span style=\"font-family: PingFangSC-light;font-size: 13px;letter-spacing: 0.544px\"><span style=\"font-family: PingFangSC-light;font-size: 13px;letter-spacing: 0.544px\"><span data-pm-slice=\"1 1 [&quot;para&quot;,{&quot;tagName&quot;:&quot;section&quot;,&quot;attributes&quot;:{&quot;powered-by&quot;:&quot;xiumi.us&quot;,&quot;style&quot;:&quot;-webkit-tap-highlight-color: transparent;outline: 0px;font-family: &quot;PingFang SC&quot;, system-ui, -apple-system, &quot;system-ui&quot;, &quot;Helvetica Neue&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.544px;white-space: normal;background-color: rgb(255, 255, 255);visibility: visible;text-align: right;&quot;},&quot;namespaceURI&quot;:&quot;http:\/\/www.w3.org\/1999\/xhtml&quot;},&quot;para&quot;,{&quot;tagName&quot;:&quot;p&quot;,&quot;attributes&quot;:{&quot;style&quot;:&quot;-webkit-tap-highlight-color: transparent;outline: 0px;visibility: 
visible;&quot;},&quot;namespaceURI&quot;:&quot;http:\/\/www.w3.org\/1999\/xhtml&quot;},&quot;node&quot;,{&quot;tagName&quot;:&quot;span&quot;,&quot;attributes&quot;:{&quot;style&quot;:&quot;-webkit-tap-highlight-color: transparent;outline: 0px;visibility: visible;text-decoration-style: solid;text-decoration-color: rgb(73, 73, 73);color: rgb(73, 73, 73);font-family: PingFangSC-light;font-size: 13px;letter-spacing: 0.544px;background-color: rgb(255, 255, 255);&quot;},&quot;namespaceURI&quot;:&quot;http:\/\/www.w3.org\/1999\/xhtml&quot;}]\">\u5f20\u6c5f<\/span><\/span><span>&nbsp;<\/span><\/span><span style=\"font-family: PingFangSC-light;letter-spacing: 0.544px;font-size: 16px;font-weight: bold\"><\/span><span style=\"font-family: PingFangSC-light;letter-spacing: 0.544px;font-size: 13px;font-weight: bold\"><span>| \u5ba1\u6821<\/span><\/span><\/p>\n<\/section>\n<p><span style=\"font-family: PingFangSC-light;letter-spacing: 0.544px;font-size: 13px;font-weight: bold\"><span><br \/><\/span><\/span><\/p>\n<\/section>\n<section style=\"margin-bottom: 0px;letter-spacing: 0.544px;, Arial, sans-serif\">\n<section style=\"margin-right: 8px;margin-left: 8px;letter-spacing: 0.544px;line-height: 1.75em\">\n<section data-id=\"85410\" data-tools=\"135\u7f16\u8f91\u5668\" style=\"letter-spacing: 0.54px\">\n<section style=\"margin: 10px auto\">\n<section style=\"margin-right: 3px;margin-left: 3px;padding: 20px\" data-mpa-action-id=\"megnjzor1d3a\" data-pm-slice=\"0 0 []\">\n<p style=\"text-align: left;margin-left: 0px;margin-right: 0px\"><strong style=\"letter-spacing: 0.54px;font-size: 16px\"><span>\u76ee\u5f55<\/span><\/strong><\/p>\n<section><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold;font-size: 15px\"><span>1.&nbsp;<span style=\"font-weight: bold\">\u80cc\u666f<\/span><\/span><\/span><\/span><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 
15px\"><span>1.1\t\u5f3a\u5316\u5b66\u4e60\u7684\u57fa\u672c\u6982\u5ff5\u4e0e\u6311\u6218<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>1.1.1\t\u57fa\u672c\u6982\u5ff5<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>1.1.2\t\u9762\u4e34\u7684\u6311\u6218<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>1.2\tQ-Learning \u7b80\u4ecb<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>1.3\t\u6df1\u5ea6\u5b66\u4e60\u4e0e\u5f3a\u5316\u5b66\u4e60\u7684\u878d\u5408\u80cc\u666f<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>1.4\tDQN \u7684\u63d0\u51fa\u53ca\u5176\u5728 Atari \u6e38\u620f\u4e2d\u7684\u7a81\u7834\u6027\u6210\u679c<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>1.4.1\t\u63d0\u51fa\u7684\u6a21\u578b<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>1.4.2\t\u6a21\u578b\u7684\u7ec6\u8282<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>1.4.3\t\u5177\u4f53\u7b97\u6cd5\u53ca\u5176\u8bad\u7ec3\u6d41\u7a0b<\/span><\/span><\/p>\n<p><span style=\"font-size: 15px\"><span style=\"font-weight: bold\">2. 
Q-Learning \u57fa\u7840<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>2.1\t\u9a6c\u5c14\u53ef\u592b\u51b3\u7b56\u8fc7\u7a0b\uff08MDP\uff09\u7b80\u4ecb<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>2.1.1\tMDP \u7684\u6838\u5fc3\u601d\u60f3<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>2.1.2\t\u7b56\u7565\u4e0e\u4ef7\u503c\u51fd\u6570<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>2.2\tQ \u503c\u51fd\u6570\u7684\u5b9a\u4e49\u4e0e\u66f4\u65b0\u516c\u5f0f<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>2.2.1\t\u5b9a\u4e49<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>2.2.2\t\u66f4\u65b0\u516c\u5f0f<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>2.3\t\u03b5-greedy \u7b56\u7565\u4e0e\u63a2\u7d22-\u5229\u7528\u6743\u8861<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>2.4\tQ-Learning \u7684\u6536\u655b\u6027<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>2.5\tQ-Learning \u7684\u5c40\u9650\u6027<\/span><\/span><\/p>\n<p><span style=\"font-size: 15px\"><span style=\"font-weight: bold\">3. 
DQN \u7684\u6838\u5fc3\u601d\u60f3\u4e0e\u7ed3\u6784<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>3.1\t\u4f7f\u7528\u795e\u7ecf\u7f51\u7edc\u903c\u8fd1 Q \u503c\u51fd\u6570<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>3.2\t\u7ecf\u9a8c\u56de\u653e\uff08Experience Replay\uff09\u673a\u5236<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>3.3\t\u76ee\u6807\u7f51\u7edc\uff08Target Network\uff09\u7684\u5f15\u5165\u4e0e\u53c2\u6570\u66f4\u65b0\u7b56\u7565<\/span><\/span><\/p>\n<p><span style=\"font-size: 15px\"><span style=\"font-weight: bold\">4. DQN\u5728pytorch\u4e2d\u7684\u7b80\u5355\u5b8c\u6574\u5b9e\u73b0<\/span><\/span><\/p>\n<p><span style=\"font-size: 15px\"><span style=\"font-weight: bold\">5. DQN \u7684\u4e3b\u8981\u6539\u8fdb\u7b97\u6cd5<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>5.1\tDouble DQN\uff1a\u89e3\u51b3 Q \u503c\u8fc7\u9ad8\u4f30\u8ba1\u95ee\u9898<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>5.1.1\tDouble DQN\u7684\u601d\u60f3<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>5.1.2\tDouble DQN\u7684\u4f18\u52bf<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>5.2\tDueling DQN\uff1a\u5206\u79bb\u72b6\u6001\u4ef7\u503c\u4e0e\u4f18\u52bf\u51fd\u6570<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>5.2.1\tDueling DQN\u7684\u601d\u60f3<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>5.2.2\tDueling DQN\u7684\u4f18\u52bf<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span 
style=\"font-size: 15px\"><span>5.3\tDRQN<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>5.3.1\tDRQN\u7684\u601d\u60f3<\/span><\/span><\/p>\n<p style=\"margin-left: 16px;margin-right: 16px\"><span style=\"font-size: 15px\"><span>5.3.2\tDRQN\u7684\u4f18\u52bf\u4e0e\u5c40\u9650<\/span><\/span><\/p>\n<p><span style=\"font-size: 15px\"><span style=\"font-weight: bold\">6. DQN \u7684\u5e94\u7528\u9886\u57df<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>6.1\tAtari \u6e38\u620f\u4e2d\u7684\u5e94\u7528\u4e0e\u8868\u73b0<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>6.2\t\u673a\u5668\u4eba\u63a7\u5236\u4e0e\u8def\u5f84\u89c4\u5212<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>6.3\t\u63a8\u8350\u7cfb\u7edf\u4e2d\u7684\u7b56\u7565\u4f18\u5316<\/span><\/span><\/p>\n<p><span style=\"font-size: 15px\"><span style=\"font-weight: bold\">7. 
DQN \u7684\u5c40\u9650\u6027\u4e0e\u6311\u6218<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>7.1\t\u5bf9\u8fde\u7eed\u52a8\u4f5c\u7a7a\u95f4\u7684\u5904\u7406\u56f0\u96be<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>7.2\t\u8bad\u7ec3\u8fc7\u7a0b\u4e2d\u7684\u6837\u672c\u6548\u7387\u95ee\u9898<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>7.3\t\u7b56\u7565\u6536\u655b\u901f\u5ea6\u6162\u4e0e\u7a33\u5b9a\u6027\u95ee\u9898<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px\"><span style=\"font-size: 15px\"><span>7.4\t\u6cdb\u5316\u80fd\u529b\u4e0e\u8fc7\u62df\u5408\u98ce\u9669<\/span><\/span><\/p>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<h2 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 24px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h2>\n<h3 style=\", Arial, sans-serif;letter-spacing: 0.544px\">\n<section style=\"letter-spacing: 0.544px;text-align: right;font-size: 13px\">\n<section style=\"margin-top: 10px;margin-bottom: 10px;letter-spacing: 0.544px;text-align: center\">\n<section style=\"vertical-align: middle\">\n<section style=\"margin-bottom: -2px;, Arial, sans-serif\">\n<section style=\"float: left;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"float: right;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"clear: both;line-height: 0\">\n<section style=\"line-height: 0;width: 0px\"><\/section>\n<\/section>\n<\/section>\n<section style=\"padding-right: 10px;padding-left: 10px;font-size: 16px;line-height: 1.4\">\n<p><strong><strong style=\"text-align: left;letter-spacing: 0.544px\"><span style=\", Arial, 
sans-serif\"><strong style=\"letter-spacing: 0.578px\"><span>1. \u80cc\u666f<\/span><\/strong><\/span><\/strong><\/strong><\/p>\n<\/section>\n<section style=\"margin-top: -2px;, Arial, sans-serif\">\n<section style=\"float: left;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"float: right;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">1.1 \u5f3a\u5316\u5b66\u4e60\u7684\u57fa\u672c\u6982\u5ff5\u4e0e\u6311\u6218<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">1.1.1 \u57fa\u672c\u6982\u5ff5<\/span><\/span><\/span><\/h4>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h4>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, 
sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5f3a\u5316\u5b66\u4e60\uff08Reinforcement Learning, RL\uff09\u662f\u4e00\u79cd\u673a\u5668\u5b66\u4e60\u65b9\u6cd5\uff0c\u5f3a\u8c03\u667a\u80fd\u4f53\uff08agent\uff09\u901a\u8fc7\u4e0e\u73af\u5883\u7684\u4ea4\u4e92\uff0c\u5728\u8bd5\u9519\u8fc7\u7a0b\u4e2d\u5b66\u4e60\u7b56\u7565\uff0c\u4ee5\u6700\u5927\u5316\u7d2f\u79ef\u5956\u52b1\u3002\u5176\u6838\u5fc3\u5728\u4e8e\u89e3\u51b3\u201c\u63a2\u7d22-\u5229\u7528\u201d\u4e4b\u95f4\u7684\u6743\u8861\uff1a\u65e2\u8981\u5c1d\u8bd5\u65b0\u7684\u52a8\u4f5c\u4ee5\u53d1\u73b0\u6f5c\u5728\u7684\u9ad8\u5956\u52b1\u7b56\u7565\uff08\u63a2\u7d22\uff09\uff0c\u53c8\u8981\u5229\u7528\u5df2\u77e5\u7684\u6700\u4f18\u7b56\u7565\u4ee5\u83b7\u5f97\u5373\u65f6\u6536\u76ca\uff08\u5229\u7528\uff09\u3002<\/span><\/span><\/p>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h4>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">1.1.2 \u9762\u4e34\u7684\u6311\u6218<\/span><\/span><\/span><\/h4>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h4>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 16px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u5c3d\u7ba1\u5f3a\u5316\u5b66\u4e60\u5728\u6e38\u620fAI\u3001\u673a\u5668\u4eba\u63a7\u5236\u3001\u63a8\u8350\u7cfb\u7edf\u7b49\u9886\u57df\u53d6\u5f97\u4e86\u663e\u8457\u6210\u679c\uff0c\u4f46\u5728\u5b9e\u9645\u5e94\u7528\u4e2d\u4ecd\u9762\u4e34\u8bf8\u591a\u6311\u6218\uff1a<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 16px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff081\uff09\u6837\u672c\u6548\u7387\u4f4e\uff1a\u5f3a\u5316\u5b66\u4e60\u901a\u5e38\u9700\u8981\u5927\u91cf\u7684\u4ea4\u4e92\u6570\u636e\u624d\u80fd\u5b66\u4e60\u6709\u6548\u7b56\u7565\uff0c\u8fd9\u5728\u6570\u636e\u83b7\u53d6\u6210\u672c\u9ad8\u6216\u4ea4\u4e92\u53d7\u9650\u7684\u573a\u666f\u4e2d\u5c24\u4e3a\u56f0\u96be\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 16px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff082\uff09\u6cdb\u5316\u80fd\u529b\u5f31\uff1a\u5728\u7279\u5b9a\u73af\u5883\u4e2d\u8bad\u7ec3\u51fa\u7684\u7b56\u7565\uff0c\u5f80\u5f80\u96be\u4ee5\u9002\u5e94\u7a0d\u6709\u53d8\u5316\u7684\u65b0\u73af\u5883\uff0c\u7f3a\u4e4f\u8fc1\u79fb\u5b66\u4e60\u80fd\u529b\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 16px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff083\uff09\u5956\u52b1\u8bbe\u8ba1\u56f0\u96be\uff1a\u8bbe\u8ba1\u5408\u9002\u7684\u5956\u52b1\u51fd\u6570\u81f3\u5173\u91cd\u8981\uff0c\u4e0d\u5f53\u7684\u5956\u52b1\u8bbe\u8ba1\u53ef\u80fd\u5bfc\u81f4\u667a\u80fd\u4f53\u5b66\u4e60\u5230\u4e0e\u9884\u671f\u4e0d\u7b26\u7684\u884c\u4e3a\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 
1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff084\uff09\u8bad\u7ec3\u7a33\u5b9a\u6027\u4e0e\u6536\u655b\u6027\u95ee\u9898\uff1a\u7279\u522b\u662f\u5728\u57fa\u4e8e\u6df1\u5ea6\u795e\u7ecf\u7f51\u7edc\u7684\u6a21\u578b\u4e2d\uff0c\u8bad\u7ec3\u8fc7\u7a0b\u53ef\u80fd\u4e0d\u7a33\u5b9a\uff0c\u5bb9\u6613\u53d1\u751f\u53d1\u6563\u3002\u7b56\u7565\u6216\u73af\u5883\u7684\u5fae\u5c0f\u53d8\u5316\u53ef\u80fd\u5bfc\u81f4\u6027\u80fd\u7684\u6781\u5927\u6ce2\u52a8\uff0c\u4f7f\u5f97\u96be\u4ee5\u83b7\u5f97\u4e00\u81f4\u7684\u7ed3\u679c\u3002\u5728\u8fde\u7eed\u6216\u9ad8\u7ef4\u52a8\u4f5c\u7a7a\u95f4\u7684\u60c5\u51b5\u4e0b\uff0c\u8fd9\u79cd\u4e0d\u7a33\u5b9a\u6027\u66f4\u52a0\u660e\u663e\uff0c\u5b66\u4e60\u8fc7\u7a0b\u53d8\u5f97\u66f4\u590d\u6742\u4e14\u96be\u4ee5\u9884\u6d4b\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">1.2 Q-Learning \u7b80\u4ecb<\/span><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q-Learning 
\u662f\u5f3a\u5316\u5b66\u4e60\u4e2d\u4e00\u79cd\u7ecf\u5178\u4e14\u5e7f\u6cdb\u5e94\u7528\u7684\u65e0\u6a21\u578b\uff08model-free\uff09\u7b97\u6cd5\uff0c\u5c5e\u4e8e\u57fa\u4e8e\u503c\uff08value-based\uff09\u7684\u65b9\u6cd5\u3002\u5176\u6838\u5fc3\u76ee\u6807\u662f\u901a\u8fc7\u5b66\u4e60\u4e00\u4e2a\u52a8\u4f5c\u4ef7\u503c\u51fd\u6570\uff08Q\u51fd\u6570\uff09\uff0c\u6307\u5bfc\u667a\u80fd\u4f53\u5728\u4e0d\u540c\u72b6\u6001\u4e0b\u9009\u62e9\u6700\u4f18\u52a8\u4f5c\uff0c\u4ee5\u6700\u5927\u5316\u957f\u671f\u7d2f\u79ef\u5956\u52b1\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e0b\u9762\u4ee5\u8001\u9f20\u5728\u8ff7\u5bab\u4e2d\u5bfb\u627e\u5976\u916a\u4e3a\u4f8b\u6765\u7406\u89e3 Q-Learning\uff1a<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff081\uff09\u73af\u5883\u8bbe\u5b9a<\/span><\/span><\/p>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u667a\u80fd\u4f53\uff08Agent\uff09\uff1a\u4e00\u53ea\u8001\u9f20\uff0c\u8d77\u59cb\u4f4d\u7f6e\u56fa\u5b9a\u3002<\/span><\/span><\/span><\/li>\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u76ee\u6807\uff08Goal\uff09\uff1a\u5728\u8ff7\u5bab\u7684\u53f3\u4e0b\u89d2\u6709\u4e00\u5757\u5976\u916a\uff0c\u8001\u9f20\u7684\u4efb\u52a1\u662f\u627e\u5230\u5e76\u5403\u5230\u5976\u916a\u3002<\/span><\/span><\/span><\/li>\n<li><span style=\"font-size: 
15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u969c\u788d\uff08Obstacle\uff09\uff1a\u8ff7\u5bab\u4e2d\u67d0\u4e9b\u4f4d\u7f6e\u6709\u6bd2\u836f\uff0c\u8001\u9f20\u9700\u8981\u907f\u514d\u8fd9\u4e9b\u4f4d\u7f6e\u3002<\/span><\/span><\/span><\/li>\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u52a8\u4f5c\uff08Actions\uff09\uff1a\u8001\u9f20\u53ef\u4ee5\u9009\u62e9\u5411\u4e0a\u3001\u4e0b\u3001\u5de6\u3001\u53f3\u79fb\u52a8\u3002<\/span><\/span><\/span><\/li>\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5956\u52b1\uff08Rewards\uff09\uff1a\u5403\u5230\u5976\u916a\uff1a+10\uff1b\u8bef\u5165\u6bd2\u836f\uff1a-10\uff1b\u5176\u4ed6\u79fb\u52a8\uff1a0<\/span><\/span><\/span><\/li>\n<\/ul>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff082\uff09Q-Learning \u5b66\u4e60\u8fc7\u7a0b<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8001\u9f20\u901a\u8fc7\u4e0d\u65ad\u5c1d\u8bd5\u4e0d\u540c\u7684\u8def\u5f84\uff0c\u5b66\u4e60\u5982\u4f55\u4ece\u8d77\u70b9\u79fb\u52a8\u5230\u5976\u916a\u6240\u5728\u7684\u4f4d\u7f6e\uff0c\u540c\u65f6\u907f\u514d\u6bd2\u836f\u3002\u6bcf\u6b21\u79fb\u52a8\u540e\uff0c\u8001\u9f20\u6839\u636e\u83b7\u5f97\u7684\u5956\u52b1\u66f4\u65b0\u5176\u5bf9\u5f53\u524d\u72b6\u6001\u4e0b\u5404\u4e2a\u52a8\u4f5c\u7684\u4ef7\u503c\u4f30\u8ba1\uff08\u5373 Q 
\u503c\uff09\u3002\u968f\u7740\u5b66\u4e60\u7684\u8fdb\u884c\uff0c\u8001\u9f20\u9010\u6e10\u5f62\u6210\u4e00\u5957\u7b56\u7565\uff0c\u4f7f\u5176\u80fd\u591f\u66f4\u5feb\u3001\u66f4\u5b89\u5168\u5730\u627e\u5230\u5976\u916a\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff083\uff09Q \u503c\u66f4\u65b0\u516c\u5f0f<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q-Learning \u7684\u6838\u5fc3\u5728\u4e8e\u901a\u8fc7\u4ee5\u4e0b\u516c\u5f0f\u66f4\u65b0 Q \u503c\uff1a&nbsp;<\/span><\/span><\/span><\/p>\n<section style=\"text-align: center\"><img class=\"rich_pages wxw-img\" data-ratio=\"0.07603686635944701\" data-s=\"300,640\" data-type=\"png\" data-w=\"2604\" style=\"width:452px;height:34px\" data-imgfileid=\"100235148\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-b70a92613ec86491c392a3113f2e941a.png\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5176\u4e2d\uff1a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"megnq28021ya\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u5f53\u524d\u72b6\u6001\uff1b<\/span><\/span><span style=\", Arial, 
sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"megnq4if1l4b\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u5f53\u524d\u52a8\u4f5c\uff1b<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>r<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"megnq6il17dl\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u5373\u65f6\u5956\u52b1\uff1b<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u6267\u884c\u52a8\u4f5c\u540e\u7684\u65b0\u72b6\u6001\uff1b<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b1<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2208<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>0<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>1<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u5b66\u4e60\u7387\uff1b<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b3<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2208<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>0<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>1<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u6298\u6263\u56e0\u5b50<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\uff084\uff09\u7b56\u7565\u9009\u62e9\uff1a\u03b5-\u8d2a\u5a6a\u7b56\u7565<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e3a\u4e86\u5728\u63a2\u7d22\u65b0\u8def\u5f84\u548c\u5229\u7528\u5df2\u77e5\u6700\u4f73\u8def\u5f84\u4e4b\u95f4\u53d6\u5f97\u5e73\u8861\uff0c\u91c7\u7528 \u03b5-\u8d2a\u5a6a\u7b56\u7565\uff1a<\/span><\/span><\/p>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4ee5\u6982\u7387 \u03b5 \u968f\u673a\u9009\u62e9\u4e00\u4e2a\u52a8\u4f5c\uff08\u63a2\u7d22\uff09<\/span><\/span><\/section>\n<\/li>\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4ee5\u6982\u7387 1 &#8211; \u03b5 \u9009\u62e9\u5f53\u524d Q \u503c\u6700\u5927\u7684\u52a8\u4f5c\uff08\u5229\u7528\uff09<\/span><\/span><\/section>\n<\/li>\n<\/ul>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u968f\u7740\u8bad\u7ec3\u7684\u8fdb\u884c\uff0c\u9010\u6e10\u51cf\u5c0f \u03b5 \u7684\u503c\uff0c\u4ee5\u51cf\u5c11\u63a2\u7d22\uff0c\u589e\u52a0\u5229\u7528\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff085\uff09\u5b66\u4e60\u8fc7\u7a0b<\/span><\/span><\/p>\n<p style=\"margin-left: 
8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4ee5\u4e0b\u662f\u8001\u9f20\u5728\u8ff7\u5bab\u4e2d\u5b66\u4e60\u7684\u7b80\u8981\u8fc7\u7a0b\uff1a<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a.\u521d\u59cb\u5316<\/span><\/span><\/b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u5c06\u6240\u6709\u72b6\u6001-\u52a8\u4f5c\u5bf9\u7684 Q \u503c\u521d\u59cb\u5316\u4e3a 0\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>b.\u9009\u62e9\u52a8\u4f5c<\/span><\/span><\/b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u6839\u636e \u03b5-\u8d2a\u5a6a\u7b56\u7565\u9009\u62e9\u4e00\u4e2a\u52a8\u4f5c\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>c.\u6267\u884c\u52a8\u4f5c<\/span><\/span><\/b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u8001\u9f20\u79fb\u52a8\u5230\u65b0\u7684\u4f4d\u7f6e\uff0c\u83b7\u5f97\u76f8\u5e94\u7684\u5956\u52b1\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><b><span style=\", Arial, 
sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>d.\u66f4\u65b0 Q \u503c<\/span><\/span><\/b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u6839\u636e Q \u503c\u66f4\u65b0\u516c\u5f0f\uff0c\u66f4\u65b0\u5f53\u524d\u72b6\u6001\u4e0b\u8be5\u52a8\u4f5c\u7684 Q \u503c\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>e.\u91cd\u590d<\/span><\/span><\/b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u5c06\u65b0\u4f4d\u7f6e\u4f5c\u4e3a\u5f53\u524d\u72b6\u6001\uff0c\u91cd\u590d\u6b65\u9aa4 b \u81f3 d\uff0c\u76f4\u5230\u8fbe\u5230\u7ec8\u6b62\u6761\u4ef6\uff08\u5982\u627e\u5230\u5976\u916a\u6216\u8fbe\u5230\u6700\u5927\u6b65\u6570\uff09\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u901a\u8fc7\u591a\u6b21\u8fed\u4ee3\uff0c\u8001\u9f20\u80fd\u591f\u5b66\u4e60\u5230\u4ece\u8d77\u70b9\u5230\u5976\u916a\u7684\u6700\u4f18\u8def\u5f84\uff0c\u540c\u65f6\u907f\u514d\u6bd2\u836f\u3002\u8be5\u793a\u4f8b\u5c55\u793a\u4e86 Q-Learning \u5982\u4f55\u901a\u8fc7\u4e0e\u73af\u5883\u7684\u4ea4\u4e92\uff0c\u5b66\u4e60\u6700\u4f18\u7b56\u7565\u4ee5\u6700\u5927\u5316\u7d2f\u79ef\u5956\u52b1\u3002\u901a\u8fc7\u4e0d\u65ad\u66f4\u65b0 Q 
\u503c\uff0c\u667a\u80fd\u4f53\u80fd\u591f\u5728\u590d\u6742\u7684\u73af\u5883\u4e2d\u627e\u5230\u6700\u4f18\u8def\u5f84\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">1.3 \u6df1\u5ea6\u5b66\u4e60\u4e0e\u5f3a\u5316\u5b66\u4e60\u7684\u878d\u5408\u80cc\u666f<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u6df1\u5ea6\u5b66\u4e60\u4e0e\u5f3a\u5316\u5b66\u4e60\u7684\u878d\u5408\u8d77\u6e90\u4e8e\u4e24\u8005\u4e92\u8865\u7684\u4f18\u52bf\uff1a\u5f3a\u5316\u5b66\u4e60\u64c5\u957f\u51b3\u7b56\u4e0e\u7b56\u7565\u4f18\u5316\uff0c\u800c\u6df1\u5ea6\u5b66\u4e60\u64c5\u957f\u5904\u7406\u9ad8\u7ef4\u611f\u77e5\u6570\u636e\uff08\u5982\u56fe\u50cf\u3001\u8bed\u97f3\u3001\u6587\u672c\u7b49\uff09\u3002\u4f20\u7edf\u5f3a\u5316\u5b66\u4e60\u65b9\u6cd5\u5728\u9762\u5bf9\u5927\u89c4\u6a21\u72b6\u6001\u7a7a\u95f4\uff08\u4f8b\u5982\u56fe\u50cf\u8f93\u5165\uff09\u65f6\uff0c\u56e0\u65e0\u6cd5\u4f7f\u7528\u67e5\u8868\u7684\u65b9\u5f0f\u5b58\u50a8 Q 
\u503c\u800c\u8868\u73b0\u4e0d\u4f73\u3002\u4e3a\u4e86\u89e3\u51b3\u8fd9\u4e00\u74f6\u9888\uff0c\u7814\u7a76\u8005\u5f15\u5165\u6df1\u5ea6\u795e\u7ecf\u7f51\u7edc\u4f5c\u4e3a\u51fd\u6570\u903c\u8fd1\u5668\uff0c\u7528\u4ee5\u4f30\u8ba1\u72b6\u6001-\u52a8\u4f5c\u503c\u51fd\u6570\uff08Q \u503c\uff09\u6216\u7b56\u7565\u51fd\u6570\uff0c\u4ece\u800c\u5927\u5e45\u63d0\u5347\u4e86\u5f3a\u5316\u5b66\u4e60\u5728\u590d\u6742\u73af\u5883\u4e2d\u7684\u6cdb\u5316\u80fd\u529b\u548c\u5b9e\u7528\u6027\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8fd9\u4e00\u878d\u5408\u7684\u4ee3\u8868\u6027\u6210\u679c\u662f 2015 \u5e74 DeepMind \u63d0\u51fa\u7684\u6df1\u5ea6 Q \u7f51\u7edc\uff08DQN\uff09<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[1]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u9996\u6b21\u5728\u65e0\u9700\u4eba\u5de5\u7279\u5f81\u8bbe\u8ba1\u7684\u60c5\u51b5\u4e0b\uff0c\u4ec5\u51ed\u50cf\u7d20\u8f93\u5165\u4fbf\u5728\u591a\u6b3e Atari \u6e38\u620f\u4e2d\u5b9e\u73b0\u4e86\u8d85\u8d8a\u4eba\u7c7b\u6c34\u5e73\u7684\u8868\u73b0\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 
15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">1.4 DQN \u7684\u63d0\u51fa\u53ca\u5176\u5728 Atari \u6e38\u620f\u4e2d\u7684\u7a81\u7834\u6027\u6210\u679c<\/span><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<section style=\"text-align: center;margin-bottom: 0px\"><img class=\"rich_pages wxw-img js_insertlocalimg\" data-ratio=\"1.193220338983051\" data-s=\"300,640\" data-type=\"gif\" data-w=\"295\" data-imgfileid=\"100235149\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-79d1be4c1c668c8de5c60f11dca134e2.gif\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\"><span style=\"font-size: 15px\" data-mpa-action-id=\"megnsqh21ue0\" data-pm-slice=\"0 0 []\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 13px\"><span>\u4e3e\u4f8b\uff1aAtari\u6e38\u620f\u4e4bbreakout\uff0c\u5f15\u81ea<\/span><\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 13px\"><span>[1]<\/span><\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Deep 
Q-Network\uff08DQN\uff09\u662f\u7531DeepMind\u56e2\u961f\u57282015\u5e74\u53d1\u8868\u7684\u8bba\u6587<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[1]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e2d\u63d0\u51fa\u7684\u6df1\u5ea6\u5f3a\u5316\u5b66\u4e60\u7b97\u6cd5\u3002\u8be5\u7814\u7a76\u9996\u6b21\u5c06\u6df1\u5ea6\u795e\u7ecf\u7f51\u7edc\u4e0eQ-learning\u7ed3\u5408\uff0c\u76f4\u63a5\u4ece\u9ad8\u7ef4\u611f\u5b98\u8f93\u5165\uff08\u5982Atari\u6e38\u620f\u7684\u50cf\u7d20\uff09\u5b66\u4e60\u63a7\u5236\u7b56\u7565\uff0c\u800c\u65e0\u9700\u624b\u5de5\u8bbe\u8ba1\u7279\u5f81\u3002DQN\u5728Atari 2600\u6e38\u620f\u4e0a\u7684\u8868\u73b0\u8fbe\u5230\u6216\u8d85\u8d8a\u4eba\u7c7b\u6c34\u5e73\uff0c\u6807\u5fd7\u7740\u6df1\u5ea6\u5f3a\u5316\u5b66\u4e60\u5728\u590d\u6742\u4efb\u52a1\u4e2d\u7684\u91cd\u5927\u7a81\u7834\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>DQN\u7684\u6838\u5fc3\u521b\u65b0\u5305\u62ec\u4f7f\u7528\u6df1\u5ea6\u5377\u79ef\u795e\u7ecf\u7f51\u7edc(CNN)\u5904\u7406\u539f\u59cb\u50cf\u7d20\u8f93\u5165\uff0c\u6a21\u4eff\u751f\u7269\u89c6\u89c9\u7cfb\u7edf\u7684\u5c42\u6b21\u5316\u7279\u5f81\u63d0\u53d6\u80fd\u529b\u3002\u6b64\u5916\uff0c\u4e3a\u4e86\u89e3\u51b3\u4f20\u7edf\u5f3a\u5316\u5b66\u4e60\u5728\u975e\u7ebf\u6027\u51fd\u6570\u903c\u8fd1\u4e0b\u7684\u4e0d\u7a33\u5b9a\u6027\uff0cDQN\u5f15\u5165\u4e86<\/span><\/span><b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u7ecf\u9a8c\u56de\u653e\uff08Experience Replay\uff09<\/span><\/span><\/b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: 
normal;font-weight: normal\"><span>\u673a\u5236\uff0c\u901a\u8fc7\u5b58\u50a8\u5e76\u968f\u673a\u91c7\u6837\u5386\u53f2\u7ecf\u9a8c\u6765\u6253\u7834\u6570\u636e\u76f8\u5173\u6027\uff0c\u63d0\u9ad8\u8bad\u7ec3\u7a33\u5b9a\u6027\u3002\u540c\u65f6\uff0c\u91c7\u7528\u76ee\u6807\u7f51\u7edc\u5206\u79bb\u6280\u672f\uff0c\u5b9a\u671f\u51bb\u7ed3\u76ee\u6807Q\u7f51\u7edc\u7684\u53c2\u6570\uff0c\u51cf\u5c11\u8bad\u7ec3\u8fc7\u7a0b\u4e2d\u7684\u6ce2\u52a8\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5728\u5b9e\u9a8c\u4e2d\uff0cDQN\u572849\u6b3eAtari 2600\u6e38\u620f\u4e0a\u8fdb\u884c\u6d4b\u8bd5\uff0c\u4ec5\u4ee5\u6e38\u620f\u5c4f\u5e55\u50cf\u7d20\u548c\u5206\u6570\u4f5c\u4e3a\u8f93\u5165\uff0c\u4f7f\u7528\u76f8\u540c\u7684\u7f51\u7edc\u67b6\u6784\u548c\u8d85\u53c2\u6570\u3002\u7ed3\u679c\u663e\u793a\uff0cDQN\u572843\u6b3e\u6e38\u620f\u4e2d\u8d85\u8d8a\u4e86\u6b64\u524d\u6240\u6709\u5f3a\u5316\u5b66\u4e60\u65b9\u6cd5\uff0c\u5e76\u572829\u6b3e\u6e38\u620f\u4e2d\u8fbe\u5230\u4eba\u7c7b\u4e13\u4e1a\u6d4b\u8bd5\u5458\u6c34\u5e73\u768475%\u4ee5\u4e0a\u3002\u4f8b\u5982\uff0c\u5728\u201cBreakout\u201d\u4e2d\uff0cDQN\u81ea\u4e3b\u53d1\u73b0\u201c\u4fa7\u8fb9\u6316\u96a7\u9053\u201d\u7684\u9ad8\u5206\u7b56\u7565\uff0c\u6700\u7ec8\u5f97\u5206\u8fdc\u8d85\u4eba\u7c7b\u73a9\u5bb6\uff1b\u5728\u201cSpace Invaders\u201d\u4e2d\uff0cDQN\u5b66\u4f1a\u5ffd\u7565\u65e0\u5173\u89c6\u89c9\u7279\u5f81\uff0c\u4e13\u6ce8\u4e8e\u5173\u952e\u72b6\u6001\u4ef7\u503c\u9884\u6d4b\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>DQN\u7684\u6210\u529f\u4e0d\u4ec5\u9a8c\u8bc1\u4e86\u7aef\u5230\u7aef\u5f3a\u5316\u5b66\u4e60\u7684\u53ef\u884c\u6027\uff0c\u8fd8\u63ed\u793a\u4e86\u6df1\u5ea6\u795e\u7ecf\u7f51\u7edc\u4e0e\u751f\u7269\u5b66\u4e60\u673a\u5236\u7684\u76f8\u4f3c\u6027\uff0c\u5982\u7ecf\u9a8c\u56de\u653e\u4e0e\u6d77\u9a6c\u4f53\u8bb0\u5fc6\u91cd\u653e\u7684\u7c7b\u6bd4\u3002\u7136\u800c\uff0cDQN\u4ecd\u5b58\u5728\u8bad\u7ec3\u6570\u636e\u9700\u6c42\u5927\u3001\u5bf9\u8d85\u957f\u7a0b\u89c4\u5212\u4efb\u52a1\uff08\u5982\u201cMontezuma\u2019s Revenge\u201d\uff09\u8868\u73b0\u6709\u9650\u7b49\u6311\u6218\u3002\u5c3d\u7ba1\u5982\u6b64\uff0cDQN\u4e3a\u540e\u7eed\u6df1\u5ea6\u5f3a\u5316\u5b66\u4e60\u7814\u7a76\u5960\u5b9a\u4e86\u57fa\u7840\uff0c\u63a8\u52a8\u4e86\u4ece\u6e38\u620fAI\u5230\u673a\u5668\u4eba\u63a7\u5236\u7b49\u9886\u57df\u7684\u5e7f\u6cdb\u5e94\u7528\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">1.4.1 \u63d0\u51fa\u7684\u6a21\u578b<\/span><\/span><\/span><\/h4>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<section style=\"text-align: center;margin-bottom: 0px\"><img class=\"rich_pages wxw-img js_insertlocalimg\" data-ratio=\"0.494\" data-s=\"300,640\" data-type=\"jpeg\" data-w=\"1000\" data-imgfileid=\"100235150\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-2c2c84494573aeeb1f99028060557ce9.jpeg\" \/><\/section>\n<p 
style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\"><span style=\"font-size: 15px\" data-mpa-action-id=\"megntdri14tc\" data-pm-slice=\"0 0 []\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 13px\"><span>\u6a21\u578b\u793a\u610f\u56fe\uff0c\u5f15\u81ea<\/span><\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 13px\"><span>[1]<\/span><\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8be5\u793a\u610f\u56fe\u5c55\u793a\u4e86\u6df1\u5ea6Q\u7f51\u7edc\uff08DQN\uff09\u7684\u5178\u578b\u67b6\u6784\u8bbe\u8ba1\uff0c\u76f4\u89c2\u5448\u73b0\u4e86\u4ece\u539f\u59cb\u6e38\u620f\u753b\u9762\u5230\u63a7\u5236\u6307\u4ee4\u7684\u7aef\u5230\u7aef\u5904\u7406\u6d41\u7a0b\u3002\u7cfb\u7edf\u91c7\u7528\u591a\u7ea7\u7279\u5f81\u63d0\u53d6\u67b6\u6784\uff0c\u5de6\u4fa7\u8f93\u5165\u5c42\u63a5\u6536\u9884\u5904\u7406\u540e\u7684\u6e38\u620f\u753b\u9762\uff0884\u00d784\u50cf\u7d20\uff0c4\u5e27\u5806\u53e0\uff09\uff0c\u901a\u8fc7\u4e24\u4e2a\u5377\u79ef\u5c42\uff08Convolution\uff09\u8fdb\u884c\u7a7a\u95f4\u7279\u5f81\u63d0\u53d6\uff0c\u5176\u4e2d\u7f51\u683c\u72b6\u7ed3\u6784\u8868\u793a\u5377\u79ef\u6838\u5728\u7a7a\u95f4\u7ef4\u5ea6\u4e0a\u7684\u7279\u5f81\u6620\u5c04\u8fc7\u7a0b\u3002\u968f\u540e\u7ecf\u7531\u4e24\u4e2a\u5168\u8fde\u63a5\u5c42\uff08Fully 
connected\uff09\u5b9e\u73b0\u9ad8\u7ea7\u7279\u5f81\u7684\u62bd\u8c61\u4e0e\u7ec4\u5408\uff0c\u6700\u7ec8\u8f93\u51fa\u5c42\u4e0e\u6e38\u620f\u624b\u67c4\u63a7\u5236\u6307\u4ee4\u76f4\u63a5\u5173\u8054\uff0c\u5e76\u6839\u636e\u5b66\u5230\u7684\u52a8\u4f5c\u4ef7\u503cQ\u6765\u9009\u62e9\u52a8\u4f5c\u3002\u8be5\u67b6\u6784\u8bbe\u8ba1\u5145\u5206\u4f53\u73b0\u4e86DQN\u76f4\u63a5\u4ece\u539f\u59cb\u50cf\u7d20\u5b66\u4e60\u63a7\u5236\u7b56\u7565\u7684\u6838\u5fc3\u601d\u60f3\uff0c\u901a\u8fc7\u5377\u79ef\u795e\u7ecf\u7f51\u7edc\u7684\u7279\u5f81\u63d0\u53d6\u80fd\u529b\u4e0e\u5f3a\u5316\u5b66\u4e60\u7684\u51b3\u7b56\u673a\u5236\u76f8\u7ed3\u5408\uff0c\u5b9e\u73b0\u4e86\u4ece\u611f\u77e5\u5230\u884c\u52a8\u7684\u5b8c\u6574\u6620\u5c04\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">1.4.2 \u6a21\u578b\u7684\u7ec6\u8282<\/span><\/span><\/span><\/h4>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u8be5\u7814\u7a76\u5728\u6a21\u578b\u8bbe\u8ba1\u4e0a\u4f53\u73b0\u4e86\u663e\u8457\u7684\u666e\u9002\u6027\u7279\u5f81\uff0c\u91c7\u7528\u5355\u4e00\u7f51\u7edc\u67b6\u6784\u5904\u7406\u6240\u6709Atari\u6e38\u620f\u4efb\u52a1\uff0c\u4ec5\u9700\u8f93\u5165\u539f\u59cb\u50cf\u7d20\u3001\u52a8\u4f5c\u7a7a\u95f4\u548c\u751f\u547d\u503c\u7b49\u57fa\u672c\u5148\u9a8c\u77e5\u8bc6\u3002\u5728\u7b97\u6cd5\u5b9e\u73b0\u65b9\u9762\uff0c\u521b\u65b0\u6027\u5730\u5f15\u5165\u4e86\u7ecf\u9a8c\u56de\u653e\u673a\u5236\uff08experience replay\uff09\uff0c\u901a\u8fc7\u5faa\u73af\u7f13\u51b2\u533a\u5b58\u50a8\u5386\u53f2\u8f6c\u79fb\u6837\u672c<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"megnui6p24t5\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"megnuk5d194f\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>r<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"megnulwbkg4\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", 
Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u5e76\u91c7\u7528\u5747\u5300\u968f\u673a\u91c7\u6837\u65b9\u5f0f\u62bd\u53d6\u5c0f\u6279\u91cf\uff08minibatch size=32\uff09\u8fdb\u884c\u8bad\u7ec3\u3002\u8fd9\u79cd\u8bbe\u8ba1\u6709\u6548\u6253\u7834\u4e86\u6570\u636e\u95f4\u7684\u65f6\u95f4\u76f8\u5173\u6027\uff0c\u663e\u8457\u63d0\u9ad8\u4e86\u6837\u672c\u5229\u7528\u7387\u548c\u8bad\u7ec3\u7a33\u5b9a\u6027\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u5728\u5956\u52b1\u51fd\u6570\u8bbe\u8ba1\u65b9\u9762\uff0c\u7814\u7a76\u8005\u91c7\u7528\u4e86\u5f52\u4e00\u5316\u5904\u7406\u7b56\u7565\uff0c\u5c06\u6b63\u5411\u5956\u52b1\u8bbe\u4e3a+1\uff0c\u8d1f\u5411\u5956\u52b1\u8bbe\u4e3a-1\uff0c\u5176\u4f59\u60c5\u51b5\u4e3a0\uff0c\u8fd9\u79cd\u6807\u51c6\u5316\u65b9\u6cd5\u6709\u6548\u63a7\u5236\u4e86\u8bef\u5dee\u8303\u56f4\u5e76\u5b9e\u73b0\u4e86\u8de8\u6e38\u620f\u7684\u7edf\u4e00\u8bad\u7ec3\u901f\u5ea6\u3002\u7ecf\u9a8c\u56de\u653e\u673a\u5236\u4e0e\u5956\u52b1\u5f52\u4e00\u5316\u7684\u534f\u540c\u4f5c\u7528\uff0c\u4f7f\u5f97\u7b97\u6cd5\u80fd\u591f\u5728\u4e0d\u540c\u6e38\u620f\u95f4\u4fdd\u6301\u4e00\u81f4\u7684\u6027\u80fd\u8868\u73b0\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u9488\u5bf9\u5927\u89c4\u6a21\u8bad\u7ec3\u6570\u636e\u7684\u9ad8\u5197\u4f59\u7279\u6027\uff0c\u7814\u7a76\u91c7\u7528\u4e86<\/span><\/span><b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>RMSProp\u4f18\u5316\u7b97\u6cd5<\/span><\/span><\/b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u5176\u6838\u5fc3\u673a\u5236\u662f\u901a\u8fc7\u5c06\u68af\u5ea6\u9664\u4ee5\u5176\u8fd1\u671f\u5e45\u5ea6\u7684\u6ed1\u52a8\u5e73\u5747\u503c\u6765\u8c03\u6574\u5b66\u4e60\u7387\u3002\u8bad\u7ec3\u8fc7\u7a0b\u4e2d\u5f15\u5165\u8870\u51cf\u7cfb\u6570<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03f5<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\uff0c\u91c7\u7528\u03f5-greedy\u7b56\u7565\u8fdb\u884c\u63a2\u7d22-\u5229\u7528\u6743\u8861\uff1a\u5728\u524d1\u767e\u4e07\u8bad\u7ec3\u6b65\u4e2d\uff0c<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03f5<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u503c\u4ece1\u7ebf\u6027\u8870\u51cf\u81f30.1\uff0c\u4e4b\u540e\u4fdd\u6301\u6052\u5b9a\u3002\u8fd9\u79cd\u52a8\u6001\u8c03\u6574\u7b56\u7565\u4e0e\u7ecf\u9a8c\u56de\u653e\u673a\u5236\u76f8\u7ed3\u5408\uff0c\u6709\u6548\u907f\u514d\u4e86\u8fc7\u65e9\u6536\u655b\u95ee\u9898\uff0c\u7279\u522b\u9002\u5408\u5904\u7406\u975e\u5e73\u7a33\u76ee\u6807\u51fd\u6570\u3002\u503c\u5f97\u6ce8\u610f\u7684\u662f\uff0c\u7ecf\u9a8c\u56de\u653e\u7f13\u51b2\u533a\u7684\u5bb9\u91cf\u8bbe\u7f6e\u4e3a1,000,000\u4e2a\u6837\u672c\uff0c\u5e76\u5728\u8bad\u7ec3\u524d\u9884\u586b\u514550,000\u5e27\u6570\u636e\u4ee5\u786e\u4fdd\u521d\u59cb\u91c7\u6837\u8d28\u91cf\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u4e3a\u63d0\u9ad8\u8ba1\u7b97\u6548\u7387\uff0c\u7814\u7a76\u8005\u5bf9\u6240\u6709\u6e38\u620f\u91c7\u7528\u4e86\u8df3\u5e27\u6280\u672f\uff08\u6bcf4\u5e27\u5904\u74061\u5e27\uff09\uff0c\u5728\u4fdd\u8bc1\u6027\u80fd\u65e0\u660e\u663e\u4e0b\u964d\u7684\u524d\u63d0\u4e0b\u663e\u8457\u63d0\u5347\u4e86\u8bad\u7ec3\u901f\u5ea6\u3002\u8fd9\u79cd\u65f6\u95f4\u62bd\u8c61\u65b9\u6cd5\u4e0e\u7ecf\u9a8c\u56de\u653e\u673a\u5236\u534f\u540c\u5de5\u4f5c\uff0c\u4f7f\u5f97\u6837\u672c\u590d\u6742\u5ea6\u76f8\u6bd4\u5728\u7ebf\u7b56\u7565\u964d\u4f4e\u4e86\u7ea610\u500d\u3002\u5b9e\u9a8c\u7ed3\u679c\u8868\u660e\uff0c\u79fb\u9664\u7ecf\u9a8c\u56de\u653e\u4f1a\u5bfc\u81f4\u6027\u80fd\u4e0b\u964d58.7%\uff0c\u5145\u5206\u9a8c\u8bc1\u4e86\u8be5\u673a\u5236\u7684\u5fc5\u8981\u6027\u3002\u8fd9\u4e9b\u521b\u65b0\u8bbe\u8ba1\u5171\u540c\u6784\u6210\u4e86DQN\u7b97\u6cd5\u7684\u6838\u5fc3\u6846\u67b6\uff0c\u4e3a\u540e\u7eed\u6df1\u5ea6\u5f3a\u5316\u5b66\u4e60\u7814\u7a76\u5960\u5b9a\u4e86\u91cd\u8981\u57fa\u7840\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">1.4.3 \u5177\u4f53\u7b97\u6cd5\u53ca\u5176\u8bad\u7ec3\u6d41\u7a0b<\/span><\/span><\/span><\/h4>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<section style=\"text-align: center;margin-bottom: 0px\"><img class=\"rich_pages wxw-img js_insertlocalimg\" data-ratio=\"0.7802690582959642\" 
data-s=\"300,640\" data-type=\"jpeg\" data-w=\"892\" style=\"width: 372px;height: 290px\" data-imgfileid=\"100235191\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-3292dc3f51ddcecdcd49b0cfbf19fea2.jpeg\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 13px\"><span>\u7b97\u6cd5\u6d41\u7a0b\uff0c\u5f15\u81ea<\/span><\/span><\/span><span style=\"font-size: 13px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[1]<\/span><\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<section style=\"text-align: center;margin-left: 8px;margin-right: 8px;margin-bottom: 0px\"><img class=\"rich_pages wxw-img js_insertlocalimg\" data-ratio=\"0.481\" data-s=\"300,640\" data-type=\"jpeg\" data-w=\"1000\" data-imgfileid=\"100235192\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-fb39c02556a096fb94513b060146833b.jpeg\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 13px\"><span>\u7b97\u6cd5\u6d41\u7a0b\u793a\u610f\u56fe\uff0c\u5f15\u81ea<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 13px\"><span>[1]<\/span><\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, 
sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>1. \u521d\u59cb\u5316\u9636\u6bb5<\/span><\/span><\/p>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u56de\u653e\u8bb0\u5fc6\u5e93(Replay Memory)\uff1a\u521b\u5efa\u5bb9\u91cf\u4e3a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>N<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u7684\u7ecf\u9a8c\u5b58\u50a8\u5e93<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>D<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u7528\u4e8e\u7f13\u5b58\u5386\u53f2\u8f6c\u79fb\u6570\u636e\u3002<\/span><\/span><\/span><\/section>\n<\/li>\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u52a8\u4f5c-\u4ef7\u503c\u51fd\u6570\u7f51\u7edc\uff1a<\/span><\/span><\/section>\n<\/li>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e3b\u7f51\u7edc<\/span><\/span><span style=\", Arial, 
sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u968f\u673a\u521d\u59cb\u5316\u7f51\u7edc\u53c2\u6570<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b8<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u8d1f\u8d23\u5b9e\u65f6\u52a8\u4f5c\u9009\u62e9\u548c\u4ef7\u503c\u4f30\u8ba1\u3002<\/span><\/span><\/span><\/section>\n<\/li>\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u76ee\u6807\u7f51\u7edc<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejmwxj71qvp\" data-pm-slice=\"0 0 []\"><span><span>\u2212<\/span><\/span><\/sup><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u521d\u59cb\u53c2\u6570<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b8<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejmxkdx1zcd\" data-pm-slice=\"0 0 []\"><span><span>\u2212<\/span><\/span><\/sup><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>=\u03b8\uff0c\u7528\u4e8e\u7a33\u5b9a\u5316\u8ba1\u7b97\u76ee\u6807Q\u503c\u3002<\/span><\/span><\/span><\/section>\n<\/li>\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 
15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8d85\u53c2\u6570\u8bbe\u5b9a\uff1a\u8bbe\u7f6e\u8bad\u7ec3\u603b\u56de\u5408\u6570M\u3001\u5355\u56de\u5408\u6700\u5927\u6b65\u6570T\u3001\u76ee\u6807\u7f51\u7edc\u540c\u6b65\u9891\u7387<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>C<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3001\u6298\u6263\u56e0\u5b50<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b3<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3001\u63a2\u7d22\u7387<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03f5<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u7b49\u3002<\/span><\/span><\/span><\/section>\n<\/li>\n<\/ul>\n<\/ul>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>2. 
\u56de\u5408\uff08Episode\uff09\u5faa\u73af \u5bf9\u6bcf\u4e2a\u56de\u5408episode=1,2,&#8230;,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>M<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u6267\u884c\uff1a \u72b6\u6001\u9884\u5904\u7406\uff1a\u521d\u59cb\u5316\u73af\u5883\u89c2\u6d4b<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>x<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejmxxe1qng\" data-pm-slice=\"0 0 []\"><span><span>1<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,\u901a\u8fc7\u9884\u5904\u7406\u51fd\u6570<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03d5<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u751f\u6210\u521d\u59cb\u72b6\u6001\u8868\u5f81<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03d5<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejmy16k1nlr\" data-pm-slice=\"0 0 []\"><span><span>1<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>=<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03d5<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: 
normal;font-weight: normal\"><span>s<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejmy42jgdf\" data-pm-slice=\"0 0 []\"><span><span>1<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>3. \u65f6\u95f4\u6b65\uff08Timestep\uff09\u5faa\u73af \u5bf9\u6bcf\u4e2a\u65f6\u95f4\u6b65t=1,2,&#8230;,T\u6267\u884c\uff1a<\/span><\/span><\/p>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u52a8\u4f5c\u9009\u62e9\uff1a<\/span><\/span><\/section>\n<\/li>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u63a2\u7d22\u7b56\u7565\uff1a\u4ee5\u6982\u7387\u03f5\u968f\u673a\u9009\u62e9\u52a8\u4f5c<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>,\u4fc3\u8fdb\u73af\u5883\u63a2\u7d22\u3002<\/span><\/span><\/span><\/section>\n<\/li>\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5229\u7528\u7b56\u7565\uff1a\u5426\u5219\uff0c\u6839\u636e\u4e3b\u7f51\u7edc\u9009\u62e9\u6700\u4f18\u52a8\u4f5c\uff1a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejmydiy1k13\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>=<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>r<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>g<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>m<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>x<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejmykh9tak\" data-pm-slice=\"0 0 []\"><span><span>a<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: 
normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03d5<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejmyrvm1x95\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b8<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><\/span><\/section>\n<\/li>\n<\/ul>\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u6267\u884c\u4e0e\u73af\u5883\u4ea4\u4e92\uff1a<\/span><\/span><\/section>\n<\/li>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u6267\u884c\u52a8\u4f5ca<\/span><\/span><sub style=\", 
Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejmz1re1r8z\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u83b7\u53d6\u5956\u52b1r<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejmz9ar1ir4\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u548c\u4e0b\u4e00\u5e27\u56fe\u50cf<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>x<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3002<\/span><\/span><\/span><\/section>\n<\/li>\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u9884\u5904\u7406\u4e0b\u4e00\u72b6\u6001<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03d5<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>=<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03d5<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3002<\/span><\/span><\/span><\/section>\n<\/li>\n<\/ul>\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5b58\u50a8\u8f6c\u79fb\u6570\u636e\uff1a\u5c06\u8f6c\u79fb\u5143\u7ec4<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03d5<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" 
data-mpa-action-id=\"mejmzskb1h6x\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejmzvcp17kh\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>r<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejmzxt95vd\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03d5<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5b58\u5165\u56de\u653e\u8bb0\u5fc6\u5e93<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>D<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3002<\/span><\/span><\/span><\/section>\n<\/li>\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u7ecf\u9a8c\u56de\u653e\u4e0e\u7f51\u7edc\u66f4\u65b0\uff1a<\/span><\/span><\/section>\n<\/li>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u968f\u673a\u91c7\u6837\uff1a\u4ece<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>D<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e2d\u5747\u5300\u62bd\u53d6\u5c0f\u6279\u91cf\u8f6c\u79fb<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03d5<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejn08j116l7\" data-pm-slice=\"0 0 []\"><span><span>j<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejn0du017l0\" data-pm-slice=\"0 0 []\"><span><span>j<\/span><\/span><\/sub><span 
style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>r<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejn0gtdcto\" data-pm-slice=\"0 0 []\"><span><span>j<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03d5<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>j<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3002<\/span><\/span><\/span><\/section>\n<\/li>\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u76ee\u6807<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u503c\u8ba1\u7b97\uff1a&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>y<\/span><\/span><sub style=\", 
Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejn0x621hex\" data-pm-slice=\"0 0 []\"><span><span>j<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>=<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>r<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejn27w61qpr\" data-pm-slice=\"0 0 []\"><span><span>j<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>+<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b3<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>m<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>x<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejn2akfjtu\" data-pm-slice=\"0 0 []\"><span><span>a<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejn499owgr\" data-pm-slice=\"0 0 []\"><span><span>\u2212<\/span><\/span><\/sup><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u03d5<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>j<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><\/span><\/section>\n<\/li>\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u68af\u5ea6\u4e0b\u964d:&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2207<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejn2qtq282\" data-pm-slice=\"0 0 []\"><span><span>\u03b8<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>1<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\/<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>|<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>B<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>|<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2211<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>y<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejn3nuc1gnh\" data-pm-slice=\"0 0 []\"><span><span>j<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2212<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03d5<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejn337m1zg0\" data-pm-slice=\"0 0 []\"><span><span>j<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejn36zi1lsm\" data-pm-slice=\"0 0 []\"><span><span>j<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b8<\/span><\/span><span style=\", 
Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejn2z8y10r6\" data-pm-slice=\"0 0 []\"><span><span>2<\/span><\/span><\/sup><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\uff0cB\u4e3abatch\u6570\u636e<\/span><\/span><\/span><\/section>\n<\/li>\n<\/ul>\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u76ee\u6807\u7f51\u7edc\u540c\u6b65\uff1a\u6bcf\u9694<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>C<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u6b65\u5c06\u4e3b\u7f51\u7edc\u53c2\u6570<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b8<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u590d\u5236\u81f3\u76ee\u6807\u7f51\u7edc<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejn6h81pre\" data-pm-slice=\"0 0 []\"><span><span>\u2212<\/span><\/span><\/sup><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u5373<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: 
normal;font-weight: normal\"><span>\u03b8<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mejn6k7c1891\" data-pm-slice=\"0 0 []\"><span><span>\u2212<\/span><\/span><\/sup><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2190<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b8<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3002<\/span><\/span><\/span><\/section>\n<\/li>\n<\/ul>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h2 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h2>\n<h3 style=\", Arial, sans-serif;letter-spacing: 0.544px\">\n<section style=\"letter-spacing: 0.544px;text-align: right;font-size: 13px\">\n<section style=\"margin-top: 10px;margin-bottom: 10px;letter-spacing: 0.544px;text-align: center\">\n<section style=\"vertical-align: middle\">\n<section style=\"margin-bottom: -2px;, Arial, sans-serif\">\n<section style=\"float: left;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"float: right;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"clear: both;line-height: 0\">\n<section style=\"line-height: 0;width: 0px\"><\/section>\n<\/section>\n<\/section>\n<section style=\"padding-right: 10px;padding-left: 10px;font-size: 16px;line-height: 1.4\">\n<p><strong><strong style=\"text-align: left;letter-spacing: 
0.544px\"><span style=\", Arial, sans-serif\"><strong style=\"letter-spacing: 0.578px\"><span>2. Q-Learning \u57fa\u7840<\/span><\/strong><\/span><\/strong><\/strong><\/p>\n<\/section>\n<section style=\"margin-top: -2px;, Arial, sans-serif\">\n<section style=\"float: left;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"float: right;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/h3>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;letter-spacing: 0.578px;line-height: 1.75em\"><span><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">2.1 \u9a6c\u5c14\u53ef\u592b\u51b3\u7b56\u8fc7\u7a0b\uff08MDP\uff09\u7b80\u4ecb<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u9a6c\u5c14\u53ef\u592b\u51b3\u7b56\u8fc7\u7a0b\uff08Markov Decision Process\uff0c\u7b80\u79f0 
MDP\uff09\u662f\u5f3a\u5316\u5b66\u4e60\u7684\u6838\u5fc3\u6570\u5b66\u6846\u67b6\uff0c\u7528\u4e8e\u5efa\u6a21\u667a\u80fd\u4f53\u5728\u4e0d\u786e\u5b9a\u73af\u5883\u4e2d\u901a\u8fc7\u8bd5\u9519\u5b66\u4e60\u6700\u4f18\u7b56\u7565\u7684\u8fc7\u7a0b\u3002\u5b83\u5728\u9a6c\u5c14\u53ef\u592b\u8fc7\u7a0b\u7684\u57fa\u7840\u4e0a\u5f15\u5165\u4e86\u201c\u52a8\u4f5c\u201d\u548c\u201c\u5956\u52b1\u201d\u673a\u5236\uff0c\u5e7f\u6cdb\u5e94\u7528\u4e8e\u4eba\u5de5\u667a\u80fd\u3001\u63a7\u5236\u7cfb\u7edf\u3001\u7ecf\u6d4e\u5b66\u7b49\u9886\u57df\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<section style=\"text-align: center;margin-left: 8px;margin-right: 8px;margin-bottom: 0px\"><img class=\"rich_pages wxw-img js_insertlocalimg\" data-ratio=\"0.43166666666666664\" data-s=\"300,640\" data-type=\"png\" data-w=\"600\" style=\"width:415px;height:179px\" data-imgfileid=\"100235288\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-5be3ae4edbfb849fb4a97cf1fb30820b.png\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\"><span style=\"font-size: 13px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mek2khnf1pt9\" data-pm-slice=\"0 0 []\"><span>\u9a6c\u5c14\u53ef\u592b\u51b3\u7b56\u8fc7\u7a0b<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span style=\"font-weight: bold\">2.1.1 MDP \u7684\u6838\u5fc3\u601d\u60f3<\/span><\/span><\/span><\/h4>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5728 MDP \u4e2d\uff0c\u667a\u80fd\u4f53\u4e0e\u73af\u5883\u7684\u4ea4\u4e92\u8fc7\u7a0b\u5982\u4e0a\u56fe\u6240\u793a\uff1a<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(1)\u667a\u80fd\u4f53\u89c2\u5bdf\u5f53\u524d\u72b6\u6001<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"meku3ch817s4\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(2)\u6839\u636e\u7b56\u7565&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03c0<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u9009\u62e9\u4e00\u4e2a\u52a8\u4f5c<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: 
normal;font-weight: normal\" data-mpa-action-id=\"meku3g3ovgk\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(3)\u73af\u5883\u6839\u636e\u72b6\u6001\u8f6c\u79fb\u6982\u7387<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>P<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\uff0c\u8f6c\u79fb\u5230\u4e0b\u4e00\u4e2a\u72b6\u6001&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u5e76\u7ed9\u4e88\u667a\u80fd\u4f53\u5956\u52b1&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>r<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"meku3nzj18j3\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(4)\u667a\u80fd\u4f53\u6839\u636e\u83b7\u5f97\u7684\u5956\u52b1\u548c\u65b0\u7684\u72b6\u6001\uff0c\u66f4\u65b0\u7b56\u7565&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03c0<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u4ee5\u671f\u83b7\u5f97\u66f4\u9ad8\u7684\u7d2f\u8ba1\u5956\u52b1\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8fd9\u4e00\u8fc7\u7a0b\u6301\u7eed\u8fdb\u884c\uff0c\u667a\u80fd\u4f53\u901a\u8fc7\u4e0d\u65ad\u4e0e\u73af\u5883\u4ea4\u4e92\uff0c\u5b66\u4e60\u6700\u4f18\u7b56\u7565\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">2.1.2 \u7b56\u7565\u4e0e\u4ef7\u503c\u51fd\u6570<\/span><\/span><\/span><\/h4>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 16px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u5728MDP\u4e2d\uff0c\u7b56\u7565\u4e0e\u4ef7\u503c\u51fd\u6570\u662f\u5f3a\u5316\u5b66\u4e60\u7684\u6838\u5fc3\u6982\u5ff5\uff0c\u5b83\u4eec\u5171\u540c\u6784\u6210\u4e86\u667a\u80fd\u4f53\u5b66\u4e60\u4e0e\u51b3\u7b56\u7684\u7406\u8bba\u57fa\u7840\u3002\u4ee5\u4e0b\u662f\u5173\u4e8e\u7b56\u7565\u4e0e\u4ef7\u503c\u51fd\u6570\u7684\u5b9a\u4e49\uff1a<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 16px;line-height: 1.75em\"><span data-pm-slice=\"0 0 []\"><span>&nbsp;\u2022&nbsp;<\/span><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u7b56\u7565&nbsp;<\/span><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03c0<\/span><\/span><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>|<\/span><\/span><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)\uff1a\u5728\u72b6\u6001 s\u4e0b\u9009\u62e9\u52a8\u4f5c a \u7684\u6982\u7387\u5206\u5e03\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 16px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span data-pm-slice=\"0 0 []\"><span>&nbsp;\u2022&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u72b6\u6001\u503c\u51fd\u6570<\/span><\/span><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>V<\/span><\/span><sub style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"meku5x6k1y\" data-pm-slice=\"0 0 []\"><span><span>\u03c0<\/span><\/span><\/sub><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)\uff1a\u5728\u7b56\u7565 \u03c0 \u4e0b\uff0c\u4ece\u72b6\u6001 s \u5f00\u59cb\uff0c\u671f\u671b\u83b7\u5f97\u7684\u7d2f\u8ba1\u5956\u52b1\u3002\u5176\u5b9a\u4e49\u4e3a\uff1a<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 16px;line-height: 1.75em;text-align: center\"><span style=\"font-size: 15px\"><span><img class=\"rich_pages wxw-img\" data-ratio=\"0.13425925925925927\" data-s=\"300,640\" data-type=\"png\" data-w=\"1080\" style=\"width: 264px;height: 35px\" data-imgfileid=\"100235308\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-3aa27254a08eee2fa8b0f6aad2a8472f.png\" \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 16px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5176\u4e2d<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b3<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u2208<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>0<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>1<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e3a\u6298\u6263\u56e0\u5b50\uff0c\u63a7\u5236\u672a\u6765\u5956\u52b1\u7684\u6743\u91cd\uff1b<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>r<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e3a\u4ece<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"meku7eqz1u1e\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5230<\/span><\/span><span style=\", Arial, 
sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u83b7\u5f97\u7684\u5373\u65f6\u5956\u52b1\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 16px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span data-pm-slice=\"0 0 []\"><span>&nbsp;\u2022&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u52a8\u4f5c\u503c\u51fd\u6570&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><sub style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"meku7uoldg1\" data-pm-slice=\"0 0 []\"><span><span>\u03c0<\/span><\/span><\/sub><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;line-height: 
1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)\uff1a\u5728\u7b56\u7565 \u03c0 \u4e0b\uff0c\u4ece\u72b6\u6001 s \u5f00\u59cb\uff0c\u91c7\u53d6\u52a8\u4f5c a \u540e\uff0c\u671f\u671b\u83b7\u5f97\u7684\u7d2f\u8ba1\u5956\u52b1\u3002\u5176\u5b9a\u4e49\u4e3a\uff1a<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 16px;line-height: 1.75em;text-align: center\"><span style=\"font-size: 15px\"><span><img class=\"rich_pages wxw-img\" data-ratio=\"0.10092592592592593\" data-s=\"300,640\" data-type=\"png\" data-w=\"1080\" style=\"width: 319px;height: 32px\" data-backw=\"304\" data-backh=\"31\" data-imgfileid=\"100235309\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-636fd0214ae7e4e84c44ec4f8b6cbc74.png\" \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8fd9\u4e9b\u51fd\u6570\u7528\u4e8e\u8bc4\u4f30\u7b56\u7565\u7684\u4f18\u52a3\uff0c\u6307\u5bfc\u7b56\u7565\u7684\u6539\u8fdb\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">2.2 Q \u503c\u51fd\u6570\u7684\u5b9a\u4e49\u4e0e\u66f4\u65b0\u516c\u5f0f<\/span><\/span><\/span><\/h3>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: 
normal;font-weight: normal\"><br \/><\/span><\/span><\/h4>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 24px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">2.2.1 \u5b9a\u4e49<\/span><\/span><\/span><\/h4>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q \u503c\u51fd\u6570&nbsp;<\/span><\/span><b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><\/b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\u8868\u793a\u667a\u80fd\u4f53\u5728\u72b6\u6001&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e0b\u91c7\u53d6\u52a8\u4f5c&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><span style=\", Arial, 
sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\u540e\uff0c\u9075\u5faa\u67d0\u4e00\u7b56\u7565\u6240\u80fd\u83b7\u5f97\u7684\u671f\u671b\u7d2f\u79ef\u5956\u52b1\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 24px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">2.2.2 \u66f4\u65b0\u516c\u5f0f<\/span><\/span><\/span><\/h4>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 24px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q-Learning \u7b97\u6cd5\u4f7f\u7528\u4ee5\u4e0b\u66f4\u65b0\u516c\u5f0f\u6765\u8fed\u4ee3 Q \u503c\uff1a<\/span><\/span><\/p>\n<section style=\"text-align: center\"><img class=\"rich_pages wxw-img\" data-ratio=\"0.075\" data-s=\"300,640\" data-type=\"png\" data-w=\"1080\" style=\"width:419px;height:31px\" data-imgfileid=\"100235310\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-c80233e894edc4519dce2b044140ad57.png\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5176\u4e2d\uff0c\u7b26\u53f7\u542b\u4e49\u5982\u4e0b\uff1a<\/span><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" 
data-mpa-action-id=\"meku8vi81otc\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u5f53\u524d\u72b6\u6001\uff1b<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"meku90m91ntj\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u5f53\u524d\u52a8\u4f5c\uff1b<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>r<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"meku933s1zwy\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u5373\u65f6\u5956\u52b1\uff1b<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u6267\u884c\u52a8\u4f5c\u540e\u7684\u65b0\u72b6\u6001\uff1b<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: 
normal;font-weight: normal\"><span>\u03b1<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2208<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>0<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>1<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u5b66\u4e60\u7387\uff1b<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b3<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2208<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>0<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>1<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a\u6298\u6263\u56e0\u5b50\u3002<\/span><\/span><\/span><\/p>\n<p 
style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u6b64\u516c\u5f0f\u57fa\u4e8e\u8d1d\u5c14\u66fc\u65b9\u7a0b\u7684\u65f6\u5e8f\u5dee\u5206\uff08TD\uff09\u66f4\u65b0\u601d\u60f3\uff0c\u9010\u6b65\u8c03\u6574&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\u503c\u51fd\u6570\u4ee5\u903c\u8fd1\u6700\u4f18\u7b56\u7565\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">2.3 \u03b5-greedy \u7b56\u7565\u4e0e\u63a2\u7d22-\u5229\u7528\u6743\u8861<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 8px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: 
normal;font-weight: normal\"><span>Q-learning \u901a\u5e38\u9762\u4e34\u201c\u63a2\u7d22\uff08exploration\uff09\u201d\u4e0e\u201c\u5229\u7528\uff08exploitation\uff09\u201d\u4e4b\u95f4\u7684\u6743\u8861\u95ee\u9898\u3002\u4e3a\u4e86\u89e3\u51b3\u8fd9\u4e00\u95ee\u9898\uff0c\u901a\u5e38\u91c7\u7528 \u03b5-greedy \u7b56\u7565\u3002\u03b5-greedy \u7b56\u7565\u662f\u4e00\u79cd\u7b80\u5355\u800c\u6709\u6548\u7684\u52a8\u4f5c\u9009\u62e9\u7b56\u7565\uff0c\u65e8\u5728\u5e73\u8861\u63a2\u7d22\u4e0e\u5229\u7528\u3002<\/span><\/span><\/p>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5229\u7528\uff08Exploitation\uff09\uff1a\u4ee5 1\u2212\u03f5 \u7684\u6982\u7387\u9009\u62e9\u5f53\u524d\u72b6\u6001\u4e0b Q \u503c\u6700\u5927\u7684\u52a8\u4f5c\uff0c\u5373\u9009\u62e9\u5df2\u77e5\u7684\u6700\u4f73\u52a8\u4f5c\u3002<\/span><\/span><\/span><\/li>\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u63a2\u7d22\uff08Exploration\uff09\uff1a\u4ee5 \u03f5 \u7684\u6982\u7387\u968f\u673a\u9009\u62e9\u4e00\u4e2a\u52a8\u4f5c\uff0c\u4ece\u800c\u63a2\u7d22\u65b0\u7684\u53ef\u80fd\u6027\u3002<\/span><\/span><\/span><\/li>\n<\/ul>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5176\u4e2d\uff0c\u03f5 \u662f\u4e00\u4e2a\u4ecb\u4e8e 0 \u548c 1 
\u4e4b\u95f4\u7684\u53c2\u6570\uff0c\u63a7\u5236\u63a2\u7d22\u7684\u9891\u7387\u3002\u8f83\u5927\u7684 \u03f5 \u503c\u9f13\u52b1\u66f4\u591a\u7684\u63a2\u7d22\uff0c\u800c\u8f83\u5c0f\u7684 \u03f5 \u503c\u5219\u503e\u5411\u4e8e\u66f4\u591a\u7684\u5229\u7528\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5728\u5b9e\u9645\u5e94\u7528\u4e2d\uff0c\u901a\u5e38\u4f1a\u968f\u7740\u8bad\u7ec3\u7684\u8fdb\u884c\u9010\u6b65\u51cf\u5c0f \u03f5 \u503c\uff0c\u4ece\u800c\u5b9e\u73b0\u4ee5\u4e0b\u76ee\u6807\uff1a<\/span><\/span><\/p>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u521d\u671f\u9636\u6bb5\uff1a\u8bbe\u7f6e\u8f83\u5927\u7684 \u03f5 \u503c\uff0c\u9f13\u52b1\u667a\u80fd\u4f53\u8fdb\u884c\u5145\u5206\u7684\u63a2\u7d22\u3002<\/span><\/span><\/span><\/li>\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u540e\u671f\u9636\u6bb5\uff1a\u9010\u6b65\u51cf\u5c0f \u03f5 \u503c\uff0c\u589e\u52a0\u5229\u7528\u5df2\u77e5\u6700\u4f73\u7b56\u7565\u7684\u9891\u7387\u3002<\/span><\/span><\/span><\/li>\n<\/ul>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u8fd9\u79cd\u7b56\u7565\u6709\u52a9\u4e8e\u667a\u80fd\u4f53\u5728\u5b66\u4e60\u521d\u671f\u83b7\u53d6\u8db3\u591f\u7684\u7ecf\u9a8c\uff0c\u5728\u540e\u671f\u5219\u80fd\u591f\u7a33\u5b9a\u5730\u6267\u884c\u6700\u4f18\u7b56\u7565\u3002<\/span><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">2.4 Q-Learning \u7684\u6536\u655b\u6027<\/span><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q-Learning \u6536\u655b\u6027\u7684\u8bc1\u660e\u4e3b\u8981\u57fa\u4e8e\u4ee5\u4e0b\u51e0\u70b9\uff1a<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff081\uff09Bellman \u6700\u4f18\u7b97\u5b50\u662f\u538b\u7f29\u6620\u5c04<\/span><\/span><span style=\", Arial, 
sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[2]<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Bellman \u6700\u4f18\u7b97\u5b50 B \u5b9a\u4e49\u4e3a\uff1a<\/span><\/span><sub data-pm-slice=\"0 0 []\"><span><img alt=\"image.png\" class=\"rich_pages wxw-img\" data-ratio=\"0.15257352941176472\" data-type=\"png\" data-w=\"1088\" style=\"vertical-align: baseline;width: 181px\" width=\"181\" data-width=\"181px\" data-imgfileid=\"100235317\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-5f7242a02a9190576b86e220e24dfee5.png\" \/><img class=\"rich_pages wxw-img\" \/><img class=\"rich_pages wxw-img\" \/><img class=\"rich_pages wxw-img\" \/><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5b83\u6ee1\u8db3\uff1a&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2016<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>B<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel6lxjp1x37\" data-pm-slice=\"0 0 []\"><span><span>1<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2212<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>B<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><sub 
style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel6lv631ugo\" data-pm-slice=\"0 0 []\"><span><span>2<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2016<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u221e<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2264<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b3<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2016<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel6m0ey3uy\" data-pm-slice=\"0 0 []\"><span><span>1<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2212<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel6m2a611q7\" data-pm-slice=\"0 0 []\"><span><span>2<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2016<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u221e<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>&nbsp;\u5373B\u662f\u4ee5\u6298\u6263\u56e0\u5b50\u03b3\u4e3a\u538b\u7f29\u7387\u7684\u538b\u7f29\u6620\u5c04\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff082\uff09Banach \u4e0d\u52a8\u70b9\u5b9a\u7406\u4fdd\u8bc1\u552f\u4e00\u56fa\u5b9a\u70b9<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u56e0\u4e3aB\u662f\u538b\u7f29\u6620\u5c04\uff0c\u5b58\u5728\u552f\u4e00\u7684\u56fa\u5b9a\u70b9<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"memlf7bu1oct\" data-pm-slice=\"0 0 []\"><span><span>\u2217<\/span><\/span><\/sup><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u6ee1\u8db3\uff1a&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"memlf9c418lq\" data-pm-slice=\"0 0 []\"><span><span>\u2217<\/span><\/span><\/sup><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>=<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>B<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>Q<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"memlfb3gale\" data-pm-slice=\"0 0 []\"><span><span>\u2217<\/span><\/span><\/sup><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\u8fd9\u5c31\u662f\u6700\u4f18\u72b6\u6001-\u52a8\u4f5c\u503c\u51fd\u6570\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff083\uff09\u968f\u673a\u903c\u8fd1\u6846\u67b6\u4e2d\u7684\u6536\u655b\u6761\u4ef6<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[3]<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q-Learning \u901a\u8fc7\u968f\u673a\u91c7\u6837\u548c\u8fed\u4ee3\u903c\u8fd1<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"memlfdup73l\" data-pm-slice=\"0 0 []\"><span><span>\u2217<\/span><\/span><\/sup><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u5728\u5b66\u4e60\u7387\u6ee1\u8db3\u4ee5\u4e0b\u6761\u4ef6\u65f6\u6536\u655b\uff1a<\/span><\/span><sub data-pm-slice=\"0 0 []\"><span><img alt=\"image.png\" class=\"rich_pages wxw-img\" data-ratio=\"0.1717171717171717\" data-type=\"png\" data-w=\"990\" style=\"vertical-align: baseline;width: 163px\" 
width=\"163\" data-width=\"163px\" data-imgfileid=\"100235318\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-679271c739bd966277c9d711c7890f93.png\" \/><img class=\"rich_pages wxw-img\" \/><img class=\"rich_pages wxw-img\" \/><img class=\"rich_pages wxw-img\" \/><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u540c\u65f6\uff0c\u7b97\u6cd5\u9700\u4fdd\u8bc1\u6bcf\u4e2a\u72b6\u6001-\u52a8\u4f5c\u5bf9 (s,a) \u88ab\u65e0\u9650\u6b21\u8bbf\u95ee\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 8px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u6536\u655b\u7684\u5173\u952e\u6761\u4ef6\uff1a<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 8px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5145\u5206\u63a2\u7d22\uff1a\u667a\u80fd\u4f53\u5fc5\u987b\u4fdd\u8bc1\u6240\u6709\u72b6\u6001-\u52a8\u4f5c\u5bf9 (s,a) \u88ab\u65e0\u9650\u6b21\u8bbf\u95ee\uff0c\u901a\u5e38\u901a\u8fc7 \u03b5-greedy \u7b49\u7b56\u7565\u5b9e\u73b0\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 8px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5b66\u4e60\u7387\u8870\u51cf\uff1a\u5b66\u4e60\u7387<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b1<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u968f\u65f6\u95f4\u8870\u51cf\uff0c\u4f46\u4e0d\u5b9c\u8fc7\u5feb\u3002\u6298\u6263\u56e0\u5b50\u9650\u5236\uff1a\u03b3\u2208[0,1)\uff0c\u4fdd\u8bc1\u672a\u6765\u5956\u52b1\u7684\u5f71\u54cd\u9012\u51cf\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5728\u6ee1\u8db3\u9002\u5f53\u7684\u5b66\u4e60\u7387\u8c03\u8282\u3001\u5145\u5206\u63a2\u7d22\u3001\u4ee5\u53ca\u6298\u6263\u56e0\u5b50\u7ea6\u675f\u7684\u60c5\u51b5\u4e0b\uff0cQ-Learning \u7b97\u6cd5\u80fd\u591f\u4ee5\u6982\u7387 1 \u6536\u655b\u5230\u6700\u4f18\u503c\u51fd\u6570<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2217<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u5176\u6570\u5b66\u8868\u8fbe\u4e3a\uff1a<\/span><\/span><sub data-pm-slice=\"0 0 []\"><span><img alt=\"image.png\" class=\"rich_pages wxw-img\" data-ratio=\"0.147239263803681\" data-type=\"png\" data-w=\"978\" style=\"vertical-align: baseline;width: 131px\" width=\"131\" data-width=\"131px\" data-imgfileid=\"100235319\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-8f8336440345b76429f3734b33721b02.png\" \/><img class=\"rich_pages wxw-img\" \/><img class=\"rich_pages wxw-img\" \/><img class=\"rich_pages wxw-img\" \/><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8fd9\u4e3a\u5f3a\u5316\u5b66\u4e60\u7b97\u6cd5\u7684\u7406\u8bba\u53ef\u9760\u6027\u63d0\u4f9b\u4e86\u575a\u5b9e\u57fa\u7840\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 
8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">2.5 Q-Learning \u7684\u5c40\u9650\u6027<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q-Learning \u5e7f\u6cdb\u5e94\u7528\u4e8e\u591a\u79cd\u51b3\u7b56\u4efb\u52a1\u3002\u5728\u5b9e\u9645\u5e94\u7528\u4e2d\uff0c\u5b83\u7684\u5c40\u9650\u6027\u4e3b\u8981\u4f53\u73b0\u5728\u4ee5\u4e0b\u51e0\u4e2a\u65b9\u9762\uff1a<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff081\uff09\u72b6\u6001-\u52a8\u4f5c\u7a7a\u95f4\u7ef4\u5ea6\u707e\u96be\uff08Curse of Dimensionality\uff09\uff1aQ-Learning \u4f7f\u7528 Q \u8868\u6765\u5b58\u50a8\u6bcf\u4e2a\u72b6\u6001-\u52a8\u4f5c\u5bf9\u7684\u4ef7\u503c\u3002\u5f53\u72b6\u6001\u6216\u52a8\u4f5c\u7a7a\u95f4\u975e\u5e38\u5927\u65f6\uff0cQ 
\u8868\u7684\u5c3a\u5bf8\u4f1a\u6025\u5267\u81a8\u80c0\uff0c\u5bfc\u81f4\u5b58\u50a8\u548c\u66f4\u65b0\u53d8\u5f97\u4e0d\u5207\u5b9e\u9645\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4f8b\u5982\uff0c\u5728\u5177\u6709\u6570\u767e\u4e07\u72b6\u6001\u548c\u52a8\u4f5c\u7684\u73af\u5883\u4e2d\uff0c\u4f20\u7edf\u7684 Q \u8868\u65b9\u6cd5\u53ef\u80fd\u65e0\u6cd5\u6709\u6548\u5904\u7406\u3002\u4e3a\u4e86\u89e3\u51b3\u8fd9\u4e2a\u95ee\u9898\uff0c\u901a\u5e38\u91c7\u7528\u51fd\u6570\u903c\u8fd1\u65b9\u6cd5\uff0c\u5982\u7ebf\u6027\u51fd\u6570\u903c\u8fd1\u6216\u6df1\u5ea6\u795e\u7ecf\u7f51\u7edc\uff0c\u4ee5\u4f30\u8ba1 Q \u503c\uff0c\u4ece\u800c\u907f\u514d\u76f4\u63a5\u4f7f\u7528\u5e9e\u5927\u7684 Q \u8868\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff082\uff09\u6536\u655b\u901f\u5ea6\u6162\uff1a\u5728\u72b6\u6001\u548c\u52a8\u4f5c\u7a7a\u95f4\u8f83\u5927\u7684\u73af\u5883\u4e2d\uff0cQ-Learning \u7684\u5b66\u4e60\u8fc7\u7a0b\u53ef\u80fd\u975e\u5e38\u7f13\u6162\uff0c\u901a\u5e38\u9700\u8981\u5927\u91cf\u7684\u8bad\u7ec3\u56de\u5408\u624d\u80fd\u6536\u655b\u5230\u6700\u4f18\u7b56\u7565\u3002\u8fd9\u79cd\u6162\u6536\u655b\u6027\u4f7f\u5f97 Q-Learning \u5728\u9700\u8981\u5feb\u901f\u5b66\u4e60\u7684\u5e94\u7528\u573a\u666f\u4e2d\u53ef\u80fd\u4e0d\u592a\u9002\u7528\u3002[1]<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br 
\/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff083\uff09\u63a2\u7d22\u4e0e\u5229\u7528\u7684\u5e73\u8861\u95ee\u9898\uff1aQ-Learning \u4f9d\u8d56\u4e8e\u63a2\u7d22\uff08exploration\uff09\u548c\u5229\u7528\uff08exploitation\uff09\u4e4b\u95f4\u7684\u5e73\u8861\u3002\u8fc7\u5ea6\u63a2\u7d22\u53ef\u80fd\u5bfc\u81f4\u5b66\u4e60\u6548\u7387\u4f4e\u4e0b\uff0c\u800c\u8fc7\u5ea6\u5229\u7528\u53ef\u80fd\u5bfc\u81f4\u9677\u5165\u5c40\u90e8\u6700\u4f18\u89e3\u3002\u4f8b\u5982\uff0c\u03b5-greedy \u7b56\u7565\u901a\u8fc7\u5f15\u5165\u968f\u673a\u6027\u6765\u5e73\u8861\u63a2\u7d22\u4e0e\u5229\u7528\uff0c\u4f46\u9009\u62e9\u5408\u9002\u7684 \u03b5 \u503c\u4ecd\u7136\u662f\u4e00\u4e2a\u6311\u6218\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff084\uff09\u5bf9\u8d85\u53c2\u6570\u654f\u611f\uff1aQ-Learning \u7684\u6027\u80fd\u5bf9\u5b66\u4e60\u7387\uff08\u03b1\uff09\u3001\u6298\u6263\u56e0\u5b50\uff08\u03b3\uff09\u548c\u63a2\u7d22\u7387\uff08\u03b5\uff09\u7b49\u8d85\u53c2\u6570\u975e\u5e38\u654f\u611f\u3002\u9009\u62e9\u4e0d\u5f53\u7684\u8d85\u53c2\u6570\u53ef\u80fd\u5bfc\u81f4\u5b66\u4e60\u8fc7\u7a0b\u4e0d\u7a33\u5b9a\u6216\u6536\u655b\u5230\u6b21\u4f18\u89e3\u3002\u4f8b\u5982\uff0c\u8fc7\u9ad8\u7684\u5b66\u4e60\u7387\u53ef\u80fd\u5bfc\u81f4 Q \u503c\u66f4\u65b0\u8fc7\u5feb\uff0c\u5bfc\u81f4\u9707\u8361\uff1b\u800c\u8fc7\u4f4e\u7684\u5b66\u4e60\u7387\u53ef\u80fd\u5bfc\u81f4\u5b66\u4e60\u8fc7\u7a0b\u8fc7\u6162\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\uff085\uff09\u5bf9\u51fd\u6570\u903c\u8fd1\u7684\u7a33\u5b9a\u6027\u95ee\u9898\uff1a\u5f53\u4f7f\u7528\u51fd\u6570\u903c\u8fd1\uff08\u5982\u795e\u7ecf\u7f51\u7edc\uff09\u6765\u4f30\u8ba1 Q \u503c\u65f6\uff0cQ-Learning \u53ef\u80fd\u51fa\u73b0\u4e0d\u7a33\u5b9a\u6216\u53d1\u6563\u7684\u60c5\u51b5\uff0c\u5c24\u5176\u662f\u5728\u975e\u7ebf\u6027\u51fd\u6570\u903c\u8fd1\u5668\u7684\u60c5\u51b5\u4e0b\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8fd9\u79cd\u4e0d\u7a33\u5b9a\u6027\u4e3b\u8981\u6e90\u4e8e\u4f30\u8ba1\u76ee\u6807\u503c\u4e0e\u5f53\u524d Q \u503c\u4e4b\u95f4\u7684\u76f8\u4e92\u4f9d\u8d56\u5173\u7cfb\u3002\u4e3a\u4e86\u89e3\u51b3\u8fd9\u4e2a\u95ee\u9898\uff0c\u63d0\u51fa\u4e86 Double Q-Learning \u7b49\u65b9\u6cd5\uff0c\u901a\u8fc7\u4f7f\u7528\u4e24\u4e2a\u72ec\u7acb\u7684 Q \u503c\u4f30\u8ba1\u5668\u6765\u51cf\u5c11\u8fc7\u4f30\u8ba1\u504f\u5dee\uff0c\u4ece\u800c\u63d0\u9ad8\u7a33\u5b9a\u6027\u3002[2]<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h2 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h2>\n<h3 style=\", Arial, sans-serif;letter-spacing: 0.544px\">\n<section style=\"letter-spacing: 0.544px;text-align: right;font-size: 13px\">\n<section style=\"margin-top: 10px;margin-bottom: 10px;letter-spacing: 0.544px;text-align: center\">\n<section style=\"vertical-align: middle\">\n<section style=\"margin-bottom: -2px;, Arial, sans-serif\">\n<section style=\"float: 
left;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"float: right;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"clear: both;line-height: 0\">\n<section style=\"line-height: 0;width: 0px\"><\/section>\n<\/section>\n<\/section>\n<section style=\"padding-right: 10px;padding-left: 10px;font-size: 16px;line-height: 1.4\">\n<p><strong><strong style=\"text-align: left;letter-spacing: 0.544px\"><span style=\", Arial, sans-serif\"><strong style=\"letter-spacing: 0.578px\"><span>4. DQN \u7684\u6838\u5fc3\u601d\u60f3\u4e0e\u7ed3\u6784<\/span><\/strong><\/span><\/strong><\/strong><\/p>\n<\/section>\n<section style=\"margin-top: -2px;, Arial, sans-serif\">\n<section style=\"float: left;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"float: right;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/h3>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;letter-spacing: 0.578px;line-height: 1.75em\"><span><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">3.1 \u4f7f\u7528\u795e\u7ecf\u7f51\u7edc\u903c\u8fd1 Q \u503c\u51fd\u6570<\/span><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1kpn\" data-pm-slice=\"0 0 []\"><span style=\"font-size: 15px\"><span style=\", Arial, 
sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>DQN\u7684<\/span><\/span><span style=\"color: #3f3f3f;font-size: 15px\"><span>\u884c\u4e3a\u503c\u51fd\u6570<\/span><\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>\u03b8<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>&nbsp;\u5229\u7528\u795e\u7ecf\u7f51\u7edc\u903c\u8fd1\uff0c\u5c5e\u4e8e\u975e\u7ebf\u6027\u903c\u8fd1\u3002\u6b64\u5904\u7684\u503c\u51fd\u6570\u5bf9\u5e94\u7740\u4e00\u7ec4\u53c2\u6570\uff0c\u5728\u795e\u7ecf\u7f51\u7edc\u91cc\u53c2\u6570\u662f\u6bcf\u5c42\u7f51\u7edc\u7684\u6743\u91cd\uff0c\u7528<\/span><\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"color: #3f3f3f;font-size: 15px\"><span>\u03b8\u8868\u793a\u3002 
\u7528\u516c\u5f0f\u8868\u793a\u7684\u8bdd\uff0c\u5982\u4e0b\uff1a<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1kpn\" data-pm-slice=\"0 0 []\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"color: #3f3f3f;font-size: 15px\"><span><br \/><\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjm1kpn\" data-pm-slice=\"0 0 []\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 15px\"><span><span>Q<\/span><\/span><\/span><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2217<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2248<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: 
normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b8<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmepk\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmepk\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5176\u4e2d\uff1a<\/span><\/span><\/p>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8f93\u5165\uff1a\u539f\u59cb\u72b6\u6001 s\uff08\u5982\u6e38\u620f\u753b\u9762\u50cf\u7d20\u77e9\u9635\uff09<\/span><\/span><\/span><\/li>\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8f93\u51fa\uff1a\u6bcf\u4e2a\u52a8\u4f5c a \u5bf9\u5e94\u7684Q\u503c\uff08\u79bb\u6563\u52a8\u4f5c\u7a7a\u95f4\uff09<\/span><\/span><\/span><\/li>\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 
1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u53c2\u6570\uff1a\u03b8 \u4e3a\u795e\u7ecf\u7f51\u7edc\u7684\u6743\u91cd\uff0c\u901a\u8fc7\u68af\u5ea6\u4e0b\u964d\u4f18\u5316<\/span><\/span><\/span><\/li>\n<\/ul>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1r94\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjm1r94\"><span style=\"font-size: 15px\"><span><img loading=\"lazy\" class=\"rich_pages wxw-img\" data-ratio=\"0.3225\" data-type=\"png\" data-w=\"400\" height=\"129\" style=\"vertical-align: middle\" width=\"400\" data-imgfileid=\"100235164\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-b60b8e14337027fb61a068ae88144e81.png\" \/><img class=\"rich_pages wxw-img\" \/><img class=\"rich_pages wxw-img\" \/><img class=\"rich_pages wxw-img\" \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjm15ix\"><span style=\"font-size: 13px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-pm-slice=\"1 1 [&quot;para&quot;,{&quot;tagName&quot;:&quot;p&quot;,&quot;attributes&quot;:{&quot;style&quot;:&quot;margin-left: 8px; margin-right: 8px; margin-bottom: 0px; line-height: 1.75em;&quot;,&quot;data-mpa-action-id&quot;:&quot;mel6pxjm15ix&quot;},&quot;namespaceURI&quot;:&quot;http:\/\/www.w3.org\/1999\/xhtml&quot;}]\" data-mpa-action-id=\"mel6sc8u11up\"><span>\u7f51\u7edc\u5177\u4f53\u7ed3\u6784<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1r94\"><span style=\"font-size: 15px\"><span style=\", 
Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1r94\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5728\u8bba\u6587<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[1]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e2dDQN\u6240\u7528\u7684\u7f51\u7edc\u7ed3\u6784\u662f\u4e09\u4e2a\u5377\u79ef\u5c42\u52a0\u4e24\u4e2a\u5168\u8fde\u63a5\u5c42\uff0c\u7f51\u7edc\u7684\u8f93\u5165\u662f\u7ecf\u8fc7\u9884\u5904\u7406\u540e\u7684\u6570\u636e\uff0c\u9884\u5904\u7406\u6307\u7684\u662f\u5c06210*160\u7684\u6e38\u620f\u56fe\u50cf\u8f6c\u5316\u4e3a84*84\u7684\u56fe\u50cf\u7b49\u64cd\u4f5c\uff0c\u5f97\u5230\u7b97\u6cd5\u7ed3\u6784\u4e2d\u7684\u5177\u4f53\u4ee3\u7801\u5b9e\u73b0\u548c\u7f51\u7edc\u7ed3\u6784\u89c1\u56fe\u548c\u4ee5\u4e0b\u4ee3\u7801\uff1a<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1r94\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<section class=\"code-snippet__fix code-snippet__js\">\n<ul class=\"code-snippet__line-index code-snippet__js\">\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<\/ul>\n<pre class=\"code-snippet__js\" data-lang=\"apache\"><code><span><span 
class=\"code-snippet__comment\"># \u9884\u5904\u7406\u56fe\u50cf<\/span><\/span><\/code><code><span><span class=\"code-snippet__attribute\">def<\/span>&nbsp;preprocess(frame):<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__comment\"># \u8f6c\u7070\u5ea6\u56fe<\/span><\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">frame<\/span>&nbsp;= cv2.cvtColor(frame, cv2.COLOR_RGB2GRAY)<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__comment\"># \u8c03\u6574\u5927\u5c0f<\/span><\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">frame<\/span>&nbsp;= cv2.resize(frame, (<span class=\"code-snippet__number\">84<\/span>,&nbsp;<span class=\"code-snippet__number\">84<\/span>))<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__comment\"># \u5f52\u4e00\u5316<\/span><\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">frame<\/span>&nbsp;= frame.astype(np.float32) \/&nbsp;<span class=\"code-snippet__number\">255<\/span>.<span class=\"code-snippet__number\">0<\/span><\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">return<\/span>&nbsp;frame<\/span><\/code><code><span><span class=\"code-snippet__comment\"># Q-Network (CNN)<\/span><\/span><\/code><code><span><span class=\"code-snippet__attribute\">class<\/span>&nbsp;DQN(nn.Module):<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">def<\/span>&nbsp;__init__(self, action_dim):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">super<\/span>(DQN, self).__init__()<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">self<\/span>.conv1 = nn.Conv2d(<span class=\"code-snippet__number\">4<\/span>,&nbsp;<span class=\"code-snippet__number\">32<\/span>, kernel_size=<span 
class=\"code-snippet__number\">8<\/span>, stride=<span class=\"code-snippet__number\">4<\/span>)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">self<\/span>.conv2 = nn.Conv2d(<span class=\"code-snippet__number\">32<\/span>,&nbsp;<span class=\"code-snippet__number\">64<\/span>, kernel_size=<span class=\"code-snippet__number\">4<\/span>, stride=<span class=\"code-snippet__number\">2<\/span>)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">self<\/span>.conv3 = nn.Conv2d(<span class=\"code-snippet__number\">64<\/span>,&nbsp;<span class=\"code-snippet__number\">64<\/span>, kernel_size=<span class=\"code-snippet__number\">3<\/span>, stride=<span class=\"code-snippet__number\">1<\/span>)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">self<\/span>.fc1 = nn.Linear(<span class=\"code-snippet__number\">64<\/span>&nbsp;*&nbsp;<span class=\"code-snippet__number\">7<\/span>&nbsp;*&nbsp;<span class=\"code-snippet__number\">7<\/span>,&nbsp;<span class=\"code-snippet__number\">512<\/span>)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">self<\/span>.fc2 = nn.Linear(<span class=\"code-snippet__number\">512<\/span>, action_dim)<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">def<\/span>&nbsp;forward(self, x):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">x<\/span>&nbsp;= F.relu(self.conv1(x))<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">x<\/span>&nbsp;= F.relu(self.conv2(x))<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">x<\/span>&nbsp;= F.relu(self.conv3(x))<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">x<\/span>&nbsp;= 
torch.flatten(x, start_dim=<span class=\"code-snippet__number\">1<\/span>)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">x<\/span>&nbsp;= F.relu(self.fc1(x))<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__attribute\">return<\/span>&nbsp;self.fc2(x)<\/span><\/code><\/pre>\n<\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1r94\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmmqi\"><span style=\"font-size: 15px\"><b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u6838\u5fc3\u610f\u4e49<\/span><\/span><\/b><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff1a<\/span><\/span><\/span><\/p>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u7aef\u5230\u7aef\u5b66\u4e60\uff1a\u76f4\u63a5\u4ece\u539f\u59cb\u72b6\u6001\uff08\u5982\u50cf\u7d20\uff09\u6620\u5c04\u5230\u52a8\u4f5c\u4ef7\u503c\uff0c\u65e0\u9700\u624b\u5de5\u8bbe\u8ba1\u7279\u5f81\u3002<\/span><\/span><\/span><\/li>\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u6cdb\u5316\u80fd\u529b\uff1a\u76f8\u4f3c\u72b6\u6001\u5171\u4eab\u795e\u7ecf\u7f51\u7edc\u7684\u7279\u5f81\u8868\u793a\uff0c\u63d0\u5347\u6837\u672c\u5229\u7528\u7387\u3002<\/span><\/span><\/span><\/li>\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u9ad8\u7ef4\u5904\u7406\uff1a\u5377\u79ef\u795e\u7ecf\u7f51\u7edc\uff08CNN\uff09\u53ef\u9ad8\u6548\u63d0\u53d6\u56fe\u50cf\u4e2d\u7684\u7a7a\u95f4\u7279\u5f81\u3002<\/span><\/span><\/span><\/li>\n<\/ul>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm243o\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm243o\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">3.2 \u7ecf\u9a8c\u56de\u653e\uff08Experience Replay\uff09\u673a\u5236<\/span><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1kgz\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1kgz\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u901a\u8fc7\u7ecf\u9a8c\u56de\u653e\u53ef\u4ee5\u4ee4\u795e\u7ecf\u7f51\u7edc\u7684\u8bad\u7ec3\u6536\u655b\u4e14\u7a33\u5b9a\u3002\u8fd9\u662f\u56e0\u4e3a\u8bad\u7ec3\u795e\u7ecf\u7f51\u7edc\u65f6\uff0c\u5b58\u5728\u7684\u5047\u8bbe\u662f\u8bad\u7ec3\u6570\u636e\u662f\u72ec\u7acb\u540c\u5206\u5e03\u7684\uff0c\u4f46\u662f\u901a\u8fc7\u5f3a\u5316\u5b66\u4e60\u91c7\u96c6\u7684\u6570\u636e\u4e4b\u95f4\u5b58\u5728\u7740\u5173\u8054\u6027\uff0c\u5229\u7528\u8fd9\u4e9b\u6570\u636e\u8fdb\u884c\u987a\u5e8f\u8bad\u7ec3\uff0c\u795e\u7ecf\u7f51\u7edc\u5f53\u7136\u4e0d\u7a33\u5b9a\u3002\u7ecf\u9a8c\u56de\u653e\u53ef\u4ee5\u6253\u7834\u6570\u636e\u95f4\u7684\u5173\u8054\u3002\u5728\u5f3a\u5316\u5b66\u4e60\u8fc7\u7a0b\u4e2d\uff0c\u667a\u80fd\u4f53\u5c06\u6570\u636e\u5b58\u50a8\u5230\u4e00\u4e2a\u6570\u636e\u5e93\u4e2d\uff0c\u518d\u5229\u7528\u5747\u5300\u968f\u673a\u91c7\u6837\u7684\u65b9\u6cd5\u4ece\u6570\u636e\u5e93\u4e2d\u62bd\u53d6\u6570\u636e\uff0c\u7136\u540e\u5229\u7528\u62bd\u53d6\u7684\u6570\u636e\u8bad\u7ec3\u795e\u7ecf\u7f51\u7edc\u3002 \u8fd9\u79cd\u7ecf\u9a8c\u56de\u653e\u7684\u6280\u5de7\u53ef\u4ee5\u6253\u7834\u6570\u636e\u4e4b\u95f4\u7684\u5173\u8054\u6027\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1kgz\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<section style=\"font-size: 17px;, Arial, sans-serif;line-height: 1.75em;letter-spacing: 0.034em;font-style: normal;font-weight: normal;margin-left: 8px;margin-right: 8px;margin-bottom: 0px;text-align: center\" data-mpa-action-id=\"mel6pxjm1ews\"><img loading=\"lazy\" class=\"rich_pages wxw-img\" data-ratio=\"1.27\" data-type=\"jpeg\" data-w=\"300\" height=\"381\" style=\"vertical-align: middle\" width=\"300\" data-imgfileid=\"100235162\" 
src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-5145be0f2a194b6507c24964f5287727.jpeg\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjmo3h\"><span style=\"font-size: 13px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel6ugnc1jtj\" data-pm-slice=\"0 0 []\"><span>\u7ecf\u9a8c\u56de\u653e<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm140o\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4ee3\u7801\u5b9e\u73b0\u53ef\u53c2\u8003\uff1a<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm140o\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<section class=\"code-snippet__fix code-snippet__js\">\n<ul class=\"code-snippet__line-index code-snippet__js\">\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<\/ul>\n<pre class=\"code-snippet__js\" data-lang=\"ruby\"><code><span><span class=\"code-snippet__comment\"># \u7ecf\u9a8c\u56de\u653e<\/span><\/span><\/code><code><span><span class=\"code-snippet__keyword\">class<\/span>&nbsp;<span class=\"code-snippet__title\">ReplayMemory<\/span>:<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">__init__<\/span>(<span class=\"code-snippet__params\"><span class=\"code-snippet__variable\">self<\/span><\/span><span class=\"code-snippet__params\">, capacity<\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span 
class=\"code-snippet__variable\">self<\/span>.memory = deque(maxlen=capacity)<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">push<\/span>(<span class=\"code-snippet__params\"><span class=\"code-snippet__variable\">self<\/span><\/span><span class=\"code-snippet__params\">, state, action, reward, next_state, done<\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__variable\">self<\/span>.memory.append((state, action, reward, next_state, done))<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">sample<\/span>(<span class=\"code-snippet__params\"><span class=\"code-snippet__variable\">self<\/span><\/span><span class=\"code-snippet__params\">, batch_size<\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">return<\/span>&nbsp;random.sample(<span class=\"code-snippet__variable\">self<\/span>.memory, batch_size)<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">__len__<\/span>(<span class=\"code-snippet__params\"><span class=\"code-snippet__variable\">self<\/span><\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">return<\/span>&nbsp;len(<span class=\"code-snippet__variable\">self<\/span>.memory)<\/span><\/code><\/pre>\n<\/section>\n<pre style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmh6e\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/pre>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmwol\"><span style=\"font-size: 
15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">3.3 \u76ee\u6807\u7f51\u7edc\uff08Target Network\uff09\u7684\u5f15\u5165\u4e0e\u53c2\u6570\u66f4\u65b0\u7b56\u7565<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmwol\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmq1f\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e3a\u4e86\u66f4\u957f\u8fdc\u7684\u63d0\u9ad8\u7a33\u5b9a\u6027\uff0c\u4f7f\u7528\u4e00\u4e2a\u72ec\u7acb\u7684\u795e\u7ecfQ\u7f51\u7edc\u53bb\u5f97\u5230target y\uff0c\u5373\u5efa\u7acb\u53e6\u4e00\u4e2a\u72ec\u7acb\u7684\u795e\u7ecf\u7f51\u7edctarget network\u3002\u6bcf\u7ecf\u8fc7c\u6b21\u66f4\u65b0\u540e\uff0c\u590d\u5236 network Q\u5f97\u5230target network Q\u2019\uff0c\u7136\u540e\u4f7f\u7528Q\u2019\u53bb\u751f\u6210target y\u5e94\u7528\u4e8e\u63a5\u4e0b\u6765\u7684c\u6b21\u66f4\u65b0\u3002\u597d\u5904\u5c31\u662f\u6bd4\u8d77online Q-learning\u7b97\u6cd5\u66f4\u7a33\u5b9a\u3002\u56e0\u4e3aonline Q-learning\u6bcf\u6b21\u66f4\u65b0\u5728\u589e\u52a0<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><sub><span>t<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u7684\u540c\u65f6\u4e5f\u589e\u52a0\u4e86\u9488\u5bf9\u6bcf\u4e2aa\u7684<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u4ece\u800c\u589e\u52a0\u4e86 target y\uff0c\u8fd9\u53c8\u53ef\u80fd\u4f1a\u5f15\u8d77\u7b56\u7565\u7684\u9707\u8361\u751a\u81f3\u53d1\u6563\u3002\u6240\u4ee5\u76ee\u6807\u7f51\u7edc\uff08Target Network\uff09\u7684\u5f15\u5165\u53ef\u4ee5\u89e3\u51b3\u8fd9\u4e00\u95ee\u9898\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm16w4\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e8e\u662f\uff0c<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm16w4\"><span data-pm-slice=\"0 0 []\"><span>&nbsp;\u2022&nbsp;<\/span><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u635f\u5931\u51fd\u6570\u8868\u793a\u4e3a\uff08\u5ffd\u7565\u65e0\u5173\u7684\u65b9\u5dee\u9879\uff09<\/span><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm16w4\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjm16w4\"><span style=\"font-size: 15px\"><span><img class=\"rich_pages wxw-img\" data-ratio=\"0.05555555555555555\" data-s=\"300,640\" data-type=\"png\" data-w=\"1080\" style=\"width: 
350px;height: 20px\" data-imgfileid=\"100235320\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-05a2b8450b017d512b04bbd21104cd89.png\" \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm16w4\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<section style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px\"><span style=\"font-size: 15px\"><span data-pm-slice=\"0 0 []\"><span>&nbsp;\u2022&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u68af\u5ea6\u4e3a<\/span><\/span><\/span><\/section>\n<section style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/section>\n<section style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;text-align: center\"><span style=\"font-size: 15px\"><span><img class=\"rich_pages wxw-img\" data-ratio=\"0.04351851851851852\" data-s=\"300,640\" data-type=\"png\" data-w=\"1080\" style=\"width: 502px;height: 22px\" data-imgfileid=\"100235321\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-6d957a8190658ca3ccf430b6d94db199.png\" \/><\/span><\/span><\/section>\n<section style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/section>\n<section style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u5de5\u7a0b\u4e2d\uff0c\u4f7f\u7528\u968f\u673a\u68af\u5ea6\u4e0b\u964d\u65b9\u6cd5\u6765\u5b8c\u6210\u4f18\u5316\uff0c\u53e6\u5916\u5f53\u4ee4<\/span><\/span><sub data-pm-slice=\"0 0 []\"><span><img alt=\"image.png\" class=\"rich_pages wxw-img\" data-ratio=\"0.29069767441860467\" data-type=\"png\" data-w=\"344\" style=\"vertical-align: baseline;width: 75px\" width=\"75\" data-width=\"75px\" data-imgfileid=\"100235322\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-b4fc7b3b0a79e19aa5b3ca23fe18c8f0.png\" \/><img class=\"rich_pages wxw-img\" \/><img class=\"rich_pages wxw-img\" \/><img class=\"rich_pages wxw-img\" \/><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u65f6\uff0c\u9000\u5316\u4e3a\u539f\u59cb\u7684 Q-Learning \u66f4\u65b0\u5f62\u5f0f\u3002<\/span><\/span><\/span><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm232c\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>DQN\u7684\u8bad\u7ec3\u4e0e\u53c2\u6570\u66f4\u65b0\u7b56\u7565\u53ef\u90e8\u5206\u53c2\u8003\u4ee5\u4e0b\u4ee3\u7801\u5b9e\u73b0\uff1a<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm232c\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<section class=\"code-snippet__fix code-snippet__js\">\n<ul class=\"code-snippet__line-index 
code-snippet__js\">\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<\/ul>\n<pre class=\"code-snippet__js\" data-lang=\"python\"><code><span><span class=\"code-snippet__comment\"># DQN Agent<\/span><\/span><\/code><code><span><span class=\"code-snippet__keyword\">class<\/span>&nbsp;<span class=\"code-snippet__title\">DQNAgent<\/span>:<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">__init__<\/span>(<span class=\"code-snippet__params\">self, action_dim<\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.action_dim = action_dim<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.memory = ReplayMemory(<span class=\"code-snippet__number\">10000<\/span>)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.policy_net = DQN(action_dim).to(device)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.target_net = DQN(action_dim).to(device)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.target_net.load_state_dict(self.policy_net.state_dict())<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.optimizer = optim.Adam(self.policy_net.parameters(), lr=<span class=\"code-snippet__number\">0.0001<\/span>)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.exploration_rate =&nbsp;<span 
class=\"code-snippet__number\">1.0<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.steps_done =&nbsp;<span class=\"code-snippet__number\">0<\/span><\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">select_action<\/span>(<span class=\"code-snippet__params\">self, state<\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__comment\"># \u03f5-\u8d2a\u5fc3\u7b56\u7565<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">if<\/span>&nbsp;random.random() &lt; self.exploration_rate:<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">return<\/span>&nbsp;random.randrange(self.action_dim)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">else<\/span>:<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">with<\/span>&nbsp;torch.no_grad():<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">return<\/span>&nbsp;self.policy_net(state).argmax().item()<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">train<\/span>(<span class=\"code-snippet__params\">self<\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__comment\"># \u6837\u672c\u4e0d\u8db3\u65f6\u76f4\u63a5\u8fd4\u56de<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">if<\/span>&nbsp;<span class=\"code-snippet__built_in\">len<\/span>(self.memory) &lt;&nbsp;<span class=\"code-snippet__number\">64<\/span>:<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span 
class=\"code-snippet__keyword\">return<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__comment\"># \u4ece\u7ecf\u9a8c\u56de\u653e\u4e2d\u91c7\u6837<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; batch = self.memory.sample(<span class=\"code-snippet__number\">64<\/span>)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; states, actions, rewards, next_states, dones =&nbsp;<span class=\"code-snippet__built_in\">zip<\/span>(*batch)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__comment\"># \u8f6c\u4e3a\u5f20\u91cf\uff0c\u5e76\u53bb\u9664\u591a\u4f59\u7ef4\u5ea6<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; states = torch.tensor(np.array(states), dtype=torch.float32).to(device) &nbsp;<span class=\"code-snippet__comment\"># shape: (64, 1, 4, 84, 84)<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; states = states.squeeze(<span class=\"code-snippet__number\">1<\/span>) &nbsp;<span class=\"code-snippet__comment\"># shape: (64, 4, 84, 84)<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; actions = torch.tensor(actions, dtype=torch.int64).unsqueeze(<span class=\"code-snippet__number\">1<\/span>).to(device) &nbsp;<span class=\"code-snippet__comment\"># shape: (64, 1)<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; rewards = torch.tensor(rewards, dtype=torch.float32).to(device) &nbsp;<span class=\"code-snippet__comment\"># shape: (64,)<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; next_states = torch.tensor(np.array(next_states), dtype=torch.float32).to(device) &nbsp;<span class=\"code-snippet__comment\"># shape: (64, 1, 4, 84, 84)<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; next_states = next_states.squeeze(<span class=\"code-snippet__number\">1<\/span>) &nbsp;<span class=\"code-snippet__comment\"># shape: (64, 4, 84, 84)<\/span><\/span><\/code><code><span>&nbsp; &nbsp; 
&nbsp; &nbsp; dones = torch.tensor(dones, dtype=torch.<span class=\"code-snippet__built_in\">bool<\/span>).to(device) &nbsp;<span class=\"code-snippet__comment\"># shape: (64,)<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__comment\"># \u8ba1\u7b97\u5f53\u524d Q \u503c<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; q_values = self.policy_net(states).gather(<span class=\"code-snippet__number\">1<\/span>, actions).squeeze()<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__comment\"># \u8ba1\u7b97\u4e0b\u4e00\u65f6\u523b\u6700\u5927 Q \u503c<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; next_q_values = self.target_net(next_states).<span class=\"code-snippet__built_in\">max<\/span>(<span class=\"code-snippet__number\">1<\/span>)[<span class=\"code-snippet__number\">0<\/span>].detach()<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__comment\"># \u8ba1\u7b97\u76ee\u6807 Q \u503c<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; target_q_values = rewards + (<span class=\"code-snippet__number\">0.99<\/span>&nbsp;* next_q_values * ~dones)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__comment\"># \u4f18\u5316<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; loss = F.mse_loss(q_values, target_q_values)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.optimizer.zero_grad()<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; loss.backward()<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.optimizer.step()<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__comment\"># \u66f4\u65b0\u63a2\u7d22\u7387<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">if<\/span>&nbsp;self.exploration_rate &gt;&nbsp;<span 
class=\"code-snippet__number\">0.01<\/span>:<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; self.exploration_rate *=&nbsp;<span class=\"code-snippet__number\">0.995<\/span><\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">update_target_net<\/span>(<span class=\"code-snippet__params\">self<\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.target_net.load_state_dict(self.policy_net.state_dict())<\/span><\/code><code><span><span class=\"code-snippet__comment\"># \u8bad\u7ec3\u5faa\u73af<\/span><\/span><\/code><code><span>&nbsp; &nbsp;...<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__comment\"># \u5b9a\u671f\u66f4\u65b0\u76ee\u6807\u7f51\u7edc<\/span><\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">if<\/span>&nbsp;episode %&nbsp;<span class=\"code-snippet__number\">10<\/span>&nbsp;==&nbsp;<span class=\"code-snippet__number\">0<\/span>:<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; agent.update_target_net()<\/span><\/code><code><span>&nbsp; &nbsp;...<\/span><\/code><\/pre>\n<\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm232c\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h2 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm100y\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h2>\n<h3 style=\", Arial, sans-serif;letter-spacing: 0.544px\">\n<section style=\"letter-spacing: 0.544px;text-align: right;font-size: 13px\">\n<section style=\"margin-top: 10px;margin-bottom: 10px;letter-spacing: 0.544px;text-align: center\">\n<section 
style=\"vertical-align: middle\">\n<section style=\"margin-bottom: -2px;, Arial, sans-serif\">\n<section style=\"float: left;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"float: right;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"clear: both;line-height: 0\">\n<section style=\"line-height: 0;width: 0px\"><\/section>\n<\/section>\n<\/section>\n<section style=\"padding-right: 10px;padding-left: 10px;font-size: 16px;line-height: 1.4\">\n<p><strong><strong style=\"text-align: left;letter-spacing: 0.544px\"><span style=\", Arial, sans-serif\"><strong style=\"letter-spacing: 0.578px\"><span>4. DQN\u5728pytorch\u4e2d\u7684\u7b80\u5355\u5b8c\u6574\u5b9e\u73b0<\/span><\/strong><\/span><\/strong><\/strong><\/p>\n<\/section>\n<section style=\"margin-top: -2px;, Arial, sans-serif\">\n<section style=\"float: left;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"float: right;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/h3>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;letter-spacing: 0.578px;line-height: 1.75em\"><span><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1q7z\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8be5\u4ee3\u7801\u57fa\u4e8e\u6df1\u5ea6Q\u7f51\u7edc\uff08DQN\uff09\u7b97\u6cd5\uff0c\u662f\u4e00\u4e2a\u7b80\u5355\u7684\u4f7f\u7528DQN\u89e3\u51b3OpenAI 
Gym\u4e2d\u7684\u7ecf\u5178\u63a7\u5236\u4efb\u52a1CartPole-v1\u7684\u5b8c\u6574\u4f8b\u5b50\u3002\u4efb\u52a1\u76ee\u6807\u662f\u63a7\u5236\u5c0f\u8f66\u5de6\u53f3\u79fb\u52a8\uff0c\u4f7f\u7ad6\u76f4\u6746\u5b50\u5c3d\u53ef\u80fd\u957f\u65f6\u95f4\u4fdd\u6301\u76f4\u7acb\u3002\u667a\u80fd\u4f53\u901a\u8fc74\u7ef4\u72b6\u6001\uff08\u5c0f\u8f66\u4f4d\u7f6e\u3001\u901f\u5ea6\u3001\u6746\u5b50\u89d2\u5ea6\u53ca\u89d2\u901f\u5ea6\uff09\u611f\u77e5\u73af\u5883\uff0c\u8f93\u51fa\u79bb\u6563\u52a8\u4f5c\uff08\u5de6\u79fb\/\u53f3\u79fb\uff09\uff0c\u6700\u7ec8\u5b9e\u73b0\u7a33\u5b9a\u5e73\u8861\u8fbe\u5230500\u6b65\u4e0a\u9650\u7684\u6ee1\u5206\u8868\u73b0\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1q7z\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<section style=\"font-size: 17px;, Arial, sans-serif;line-height: 1.75em;letter-spacing: 0.034em;font-style: normal;font-weight: normal;margin-left: 8px;margin-right: 8px;margin-bottom: 0px;text-align: center\" data-mpa-action-id=\"mel6pxjm1k70\" data-pm-slice=\"1 2 []\"><img loading=\"lazy\" class=\"rich_pages wxw-img\" data-ratio=\"0.6366666666666667\" data-type=\"jpeg\" data-w=\"300\" height=\"191\" style=\"vertical-align: middle\" width=\"300\" data-imgfileid=\"100235166\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-40eb7c73effbd907c45cf2e85eaac6e9.jpeg\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjmsq\"><span style=\"font-size: 13px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel719j3ix0\" data-pm-slice=\"0 0 []\"><span>CartPole-v1<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" 
data-mpa-action-id=\"mel6pxjm3kd\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u7b97\u6cd5\u5b9e\u73b0\u8981\u70b9\u5982\u4e0b\u3002<br \/>Q\u503c\u7f51\u7edc\uff1a\u4f7f\u7528\u4e09\u5c42\u5168\u8fde\u63a5\u795e\u7ecf\u7f51\u7edc\uff08\u8f93\u51654\u7ef4\u2192128\u2192128\u2192\u8f93\u51fa2\u7ef4\uff09\u8fd1\u4f3cQ\u503c\u51fd\u6570\uff0c\u8f93\u51fa\u5de6\u53f3\u79fb\u52a8\u7684\u52a8\u4f5c\u4ef7\u503c\u3002\u76ee\u6807\u7f51\u7edc\u4e0e\u4e3b\u7f51\u7edc\u5206\u79bb\uff0c\u5b9a\u671f\u540c\u6b65\u53c2\u6570\u4ee5\u7a33\u5b9a\u8bad\u7ec3\u3002<br \/>\u7ecf\u9a8c\u56de\u653e\uff1a\u5b58\u50a810,000\u6761\u5386\u53f2\u8f6c\u79fb\u6837\u672c\uff08\u72b6\u6001\u3001\u52a8\u4f5c\u3001\u5956\u52b1\u3001\u4e0b\u4e00\u72b6\u6001\u3001\u7ec8\u6b62\u6807\u5fd7\uff09\uff0c\u8bad\u7ec3\u65f6\u968f\u673a\u91c7\u683764\u6761\u6570\u636e\u6253\u7834\u65f6\u5e8f\u76f8\u5173\u6027\u3002<br \/>\u8bad\u7ec3\u673a\u5236\uff1a\u03b5-\u8d2a\u5a6a\u7b56\u7565\u52a8\u6001\u8870\u51cf\uff08\u521d\u59cb\u03b5=1.0\uff0c\u8870\u51cf\u73870.995\uff0c\u6700\u4f4e\u03b5=0.01\uff09\uff0c\u5e73\u8861\u63a2\u7d22\u4e0e\u5229\u7528\u3002\u57fa\u4e8e\u8d1d\u5c14\u66fc\u65b9\u7a0b\u8ba1\u7b97\u76ee\u6807Q\u503c\uff0c\u901a\u8fc7\u5747\u65b9\u8bef\u5dee\u635f\u5931\u66f4\u65b0\u7f51\u7edc\uff0c\u6298\u6263\u56e0\u5b50\u03b3=0.99\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm3kd\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<section class=\"code-snippet__fix code-snippet__js\">\n<ul class=\"code-snippet__line-index 
code-snippet__js\">\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<li><\/li>\n<\/ul>\n<pre class=\"code-snippet__js\" data-lang=\"python\"><code><span><span class=\"code-snippet__keyword\">import<\/span>&nbsp;torch<\/span><\/code><code><span><span class=\"code-snippet__keyword\">import<\/span>&nbsp;torch.nn&nbsp;<span class=\"code-snippet__keyword\">as<\/span>&nbsp;nn<\/span><\/code><code><span><span class=\"code-snippet__keyword\">import<\/span>&nbsp;torch.optim&nbsp;<span class=\"code-snippet__keyword\">as<\/span>&nbsp;optim<\/span><\/code><code><span><span class=\"code-snippet__keyword\">import<\/span>&nbsp;random<\/span><\/code><code><span><span class=\"code-snippet__keyword\">from<\/span>&nbsp;collections&nbsp;<span class=\"code-snippet__keyword\">import<\/span>&nbsp;deque<\/span><\/code><code><span><span class=\"code-snippet__keyword\">import<\/span>&nbsp;gym<\/span><\/code><code><span><span 
class=\"code-snippet__comment\"># \u5b9a\u4e49Q\u7f51\u7edc<\/span><\/span><\/code><code><span><span class=\"code-snippet__keyword\">class<\/span>&nbsp;<span class=\"code-snippet__title\">QNetwork<\/span>(nn.Module):<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">__init__<\/span>(<span class=\"code-snippet__params\">self, input_dim, output_dim<\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__built_in\">super<\/span>(QNetwork, self).__init__()<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.fc = nn.Sequential(<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; nn.Linear(input_dim,&nbsp;<span class=\"code-snippet__number\">128<\/span>),<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; nn.ReLU(),<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; nn.Linear(<span class=\"code-snippet__number\">128<\/span>,&nbsp;<span class=\"code-snippet__number\">128<\/span>),<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; nn.ReLU(),<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; nn.Linear(<span class=\"code-snippet__number\">128<\/span>, output_dim)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; )<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">forward<\/span>(<span class=\"code-snippet__params\">self, x<\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">return<\/span>&nbsp;self.fc(x)<\/span><\/code><code><span><span class=\"code-snippet__comment\"># \u5b9a\u4e49DQN\u4ee3\u7406<\/span><\/span><\/code><code><span><span class=\"code-snippet__keyword\">class<\/span>&nbsp;<span class=\"code-snippet__title\">DQNAgent<\/span>:<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span 
class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">__init__<\/span>(<span class=\"code-snippet__params\">self, state_dim, action_dim, lr=<\/span><span class=\"code-snippet__params\"><span class=\"code-snippet__number\">0.001<\/span><\/span><span class=\"code-snippet__params\">, gamma=<\/span><span class=\"code-snippet__params\"><span class=\"code-snippet__number\">0.99<\/span><\/span><span class=\"code-snippet__params\">, epsilon=<\/span><span class=\"code-snippet__params\"><span class=\"code-snippet__number\">1.0<\/span><\/span><span class=\"code-snippet__params\">, epsilon_decay=<\/span><span class=\"code-snippet__params\"><span class=\"code-snippet__number\">0.995<\/span><\/span><span class=\"code-snippet__params\">, min_epsilon=<\/span><span class=\"code-snippet__params\"><span class=\"code-snippet__number\">0.01<\/span><\/span><span class=\"code-snippet__params\">, buffer_size=<\/span><span class=\"code-snippet__params\"><span class=\"code-snippet__number\">10000<\/span><\/span><span class=\"code-snippet__params\">, batch_size=<\/span><span class=\"code-snippet__params\"><span class=\"code-snippet__number\">64<\/span><\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.state_dim = state_dim<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.action_dim = action_dim<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.gamma = gamma<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.epsilon = epsilon<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.epsilon_decay = epsilon_decay<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.min_epsilon = min_epsilon<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.batch_size = batch_size<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.q_network = QNetwork(state_dim, action_dim)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.target_network = QNetwork(state_dim, 
action_dim)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.target_network.load_state_dict(self.q_network.state_dict())<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.optimizer = optim.Adam(self.q_network.parameters(), lr=lr)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.replay_buffer = deque(maxlen=buffer_size)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.criterion = nn.MSELoss()<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">choose_action<\/span>(<span class=\"code-snippet__params\">self, state<\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">if<\/span>&nbsp;random.random() &lt; self.epsilon:<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">return<\/span>&nbsp;random.randint(<span class=\"code-snippet__number\">0<\/span>, self.action_dim -&nbsp;<span class=\"code-snippet__number\">1<\/span>)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">else<\/span>:<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; state = torch.tensor([state], dtype=torch.float32)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp; q_values = self.q_network(state)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">return<\/span>&nbsp;torch.argmax(q_values).item()<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">store_experience<\/span>(<span class=\"code-snippet__params\">self, state, action, reward, next_state, done<\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.replay_buffer.append((state, action, reward, next_state, done))<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span 
class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">update_network<\/span>(<span class=\"code-snippet__params\">self<\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">if<\/span>&nbsp;<span class=\"code-snippet__built_in\">len<\/span>(self.replay_buffer) &lt; self.batch_size:<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; &nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">return<\/span><\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; batch = random.sample(self.replay_buffer, self.batch_size)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; states, actions, rewards, next_states, dones =&nbsp;<span class=\"code-snippet__built_in\">zip<\/span>(*batch)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; states = torch.tensor(states, dtype=torch.float32)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; actions = torch.tensor(actions, dtype=torch.int64)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; rewards = torch.tensor(rewards, dtype=torch.float32)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; next_states = torch.tensor(next_states, dtype=torch.float32)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; dones = torch.tensor(dones, dtype=torch.float32)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; q_values = self.q_network(states).gather(<span class=\"code-snippet__number\">1<\/span>, actions.unsqueeze(<span class=\"code-snippet__number\">1<\/span>)).squeeze()<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; next_q_values = self.target_network(next_states).<span class=\"code-snippet__built_in\">max<\/span>(<span class=\"code-snippet__number\">1<\/span>)[<span class=\"code-snippet__number\">0<\/span>]<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; target_q_values = rewards + self.gamma * next_q_values * (<span class=\"code-snippet__number\">1<\/span>&nbsp;- dones)<\/span><\/code><code><span>&nbsp; 
&nbsp; &nbsp; &nbsp; loss = self.criterion(q_values, target_q_values)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.optimizer.zero_grad()<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; loss.backward()<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.optimizer.step()<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">update_target_network<\/span>(<span class=\"code-snippet__params\">self<\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.target_network.load_state_dict(self.q_network.state_dict())<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">def<\/span>&nbsp;<span class=\"code-snippet__title\">decay_epsilon<\/span>(<span class=\"code-snippet__params\">self<\/span>):<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; self.epsilon =&nbsp;<span class=\"code-snippet__built_in\">max<\/span>(self.min_epsilon, self.epsilon * self.epsilon_decay)<\/span><\/code><code><span><span class=\"code-snippet__comment\"># \u73af\u5883<\/span><\/span><\/code><code><span>env = gym.make(<span class=\"code-snippet__string\">'CartPole-v1'<\/span>)<\/span><\/code><code><span>state_dim = env.observation_space.shape[<span class=\"code-snippet__number\">0<\/span>]<\/span><\/code><code><span>action_dim = env.action_space.n<\/span><\/code><code><span><span class=\"code-snippet__comment\"># \u521d\u59cb\u5316\u4ee3\u7406<\/span><\/span><\/code><code><span>agent = DQNAgent(state_dim, action_dim)<\/span><\/code><code><span><span class=\"code-snippet__comment\"># \u8bad\u7ec3\u5faa\u73af<\/span><\/span><\/code><code><span>episodes =&nbsp;<span class=\"code-snippet__number\">1000<\/span><\/span><\/code><code><span><span class=\"code-snippet__keyword\">for<\/span>&nbsp;episode&nbsp;<span class=\"code-snippet__keyword\">in<\/span>&nbsp;<span 
class=\"code-snippet__built_in\">range<\/span>(episodes):<\/span><\/code><code><span>&nbsp; &nbsp; state = env.reset()<\/span><\/code><code><span>&nbsp; &nbsp; total_reward =&nbsp;<span class=\"code-snippet__number\">0<\/span><\/span><\/code><code><span>&nbsp; &nbsp; done =&nbsp;<span class=\"code-snippet__literal\">False<\/span><\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__keyword\">while<\/span>&nbsp;<span class=\"code-snippet__keyword\">not<\/span>&nbsp;done:<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; action = agent.choose_action(state)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; next_state, reward, done, _ = env.step(action)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; agent.store_experience(state, action, reward, next_state, done)<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; agent.update_network()<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; state = next_state<\/span><\/code><code><span>&nbsp; &nbsp; &nbsp; &nbsp; total_reward += reward<\/span><\/code><code><span>&nbsp; &nbsp; agent.update_target_network()<\/span><\/code><code><span>&nbsp; &nbsp; agent.decay_epsilon()<\/span><\/code><code><span>&nbsp; &nbsp;&nbsp;<span class=\"code-snippet__built_in\">print<\/span>(<span class=\"code-snippet__string\">f'Episode&nbsp;<\/span><span class=\"code-snippet__string\"><span class=\"code-snippet__subst\">{episode +&nbsp;<\/span><\/span><span class=\"code-snippet__string\"><span class=\"code-snippet__subst\"><span class=\"code-snippet__number\">1<\/span><\/span><\/span><span class=\"code-snippet__string\"><span class=\"code-snippet__subst\">}<\/span><\/span><span class=\"code-snippet__string\">\/<\/span><span class=\"code-snippet__string\"><span class=\"code-snippet__subst\">{episodes}<\/span><\/span><span class=\"code-snippet__string\">, Total Reward:&nbsp;<\/span><span class=\"code-snippet__string\"><span class=\"code-snippet__subst\">{total_reward}<\/span><\/span><span 
class=\"code-snippet__string\">, Epsilon:&nbsp;<\/span><span class=\"code-snippet__string\"><span class=\"code-snippet__subst\">{agent.epsilon:<\/span><\/span><span class=\"code-snippet__string\"><span class=\"code-snippet__subst\"><span class=\"code-snippet__number\">.3<\/span><\/span><\/span><span class=\"code-snippet__string\"><span class=\"code-snippet__subst\">f}<\/span><\/span><span class=\"code-snippet__string\">'<\/span>)<\/span><\/code><code><span><span class=\"code-snippet__comment\"># \u8bc4\u4f30<\/span><\/span><\/code><code><span>state = env.reset()<\/span><\/code><code><span>done =&nbsp;<span class=\"code-snippet__literal\">False<\/span><\/span><\/code><code><span><span class=\"code-snippet__keyword\">while<\/span>&nbsp;<span class=\"code-snippet__keyword\">not<\/span>&nbsp;done:<\/span><\/code><code><span>&nbsp; &nbsp; action = agent.choose_action(state)<\/span><\/code><code><span>&nbsp; &nbsp; state, _, done, _ = env.step(action)<\/span><\/code><code><span>&nbsp; &nbsp; env.render()<\/span><\/code><code><span>env.close()<\/span><\/code><\/pre>\n<\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm3kd\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm3kd\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h3 style=\", Arial, sans-serif;letter-spacing: 0.544px\">\n<section style=\"letter-spacing: 0.544px;text-align: right;font-size: 13px\">\n<section style=\"margin-top: 10px;margin-bottom: 10px;letter-spacing: 0.544px;text-align: center\">\n<section style=\"vertical-align: middle\">\n<section style=\"margin-bottom: -2px;, Arial, sans-serif\">\n<section style=\"float: left;width: 
8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"float: right;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"clear: both;line-height: 0\">\n<section style=\"line-height: 0;width: 0px\"><\/section>\n<\/section>\n<\/section>\n<section style=\"padding-right: 10px;padding-left: 10px;font-size: 16px;line-height: 1.4\">\n<p><strong><strong style=\"text-align: left;letter-spacing: 0.544px\"><span style=\", Arial, sans-serif\"><strong style=\"letter-spacing: 0.578px\"><span>5. DQN \u7684\u4e3b\u8981\u6539\u8fdb\u7b97\u6cd5<\/span><\/strong><\/span><\/strong><\/strong><\/p>\n<\/section>\n<section style=\"margin-top: -2px;, Arial, sans-serif\">\n<section style=\"float: left;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"float: right;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/h3>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;letter-spacing: 0.578px;line-height: 1.75em\"><span><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmepz\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">5.1 Double DQN\uff1a\u89e3\u51b3 Q \u503c\u8fc7\u9ad8\u4f30\u8ba1\u95ee\u9898<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmepz\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm17l5\"><span style=\"font-size: 15px\"><span 
style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">5.1.1 Double DQN\u7684\u601d\u60f3<\/span><\/span><\/span><\/h4>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm17l5\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h4>\n<section style=\"font-size: 17px;, Arial, sans-serif;line-height: 1.75em;letter-spacing: 0.034em;font-style: normal;font-weight: normal;margin-left: 8px;margin-right: 8px;margin-bottom: 0px;text-indent: 0px;text-align: center\" data-mpa-action-id=\"mel6pxjm11as\"><img loading=\"lazy\" class=\"rich_pages wxw-img\" data-ratio=\"0.865\" data-type=\"png\" data-w=\"400\" height=\"346\" style=\"vertical-align: middle\" width=\"400\" data-imgfileid=\"100235170\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-f5bd58806c5e6746a73d99a0b73ffb31.png\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjm1lt6\"><span style=\"font-size: 13px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel73tupnj6\" data-pm-slice=\"0 0 []\"><span>\u5728DQN\u4e0eDouble DQN\u4e2d\u4f7f\u7528\u76ee\u6807\u7f51\u7edc\u7684\u5b66\u4e60\u7ed3\u6784<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1lt6\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 24px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm5od\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u5728\u7ecf\u5178\u7684 Q-L<\/span>earning \u53ca\u5176\u6df1\u5ea6\u7248\u672c DQN\uff08Deep Q-Network\uff09\u4e2d\uff0c\u52a8\u4f5c\u503c\u51fd\u6570\u7684\u4f30\u8ba1\u5b58\u5728\u7cfb\u7edf\u6027\u504f\u5dee\uff0c\u5373\u8fc7\u9ad8\u4f30\u8ba1\uff08overestimation bias\uff09\u3002\u8fd9\u79cd\u504f\u5dee\u6e90\u81ea\u4e8e\u6700\u5927\u5316\u64cd\u4f5c\uff1a<\/span><\/p>\n<section style=\"text-align: center\"><img class=\"rich_pages wxw-img\" data-ratio=\"0.23636363636363636\" data-s=\"300,640\" data-type=\"png\" data-w=\"660\" style=\"width:111px;height:26px\" data-imgfileid=\"100235323\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-002f3aae34ddf0201efdce11eb86f488.png\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm5od\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5f53\u4f30\u8ba1\u7684 Q \u503c\u5b58\u5728\u566a\u58f0\u65f6\uff0c\u76f4\u63a5\u9009\u53d6\u6700\u5927 Q \u503c\u52a8\u4f5c\u5bb9\u6613\u5bfc\u81f4\u671f\u671b\u7684\u8fc7\u9ad8\u4f30\u8ba1\uff0c\u4ece\u800c\u5f71\u54cd\u7b56\u7565\u7684\u7a33\u5b9a\u6027\u548c\u6700\u7ec8\u6027\u80fd\u3002\u4e3a\u4e86\u51cf\u5c11 DQN \u4e2d\u7684 Q \u503c\u8fc7\u9ad8\u4f30\u8ba1\uff0cDouble DQN \u5f15\u5165\u4e86\u4e24\u4e2a Q \u7f51\u7edc\uff1a\u5f53\u524d Q \u7f51\u7edc\u548c\u76ee\u6807 Q \u7f51\u7edc<\/span><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[4]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 24px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmy1q\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 
0.034em;font-style: normal;font-weight: normal\"><span>\u7ecf\u5178 DQN \u7684\u76ee\u6807 Q \u503c\u8ba1\u7b97\u516c\u5f0f\u4e3a\uff1a<\/span><\/span><\/p>\n<section style=\"text-align: center\"><img class=\"rich_pages wxw-img\" data-ratio=\"0.11388888888888889\" data-s=\"300,640\" data-type=\"png\" data-w=\"1080\" style=\"width:232px;height:27px\" data-imgfileid=\"100235324\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-05801c93de5878d6f335ef24eba924f2.png\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmy1q\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5176\u4e2d\uff1a&nbsp;<\/span><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>r<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel76jrdk3y\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\u662f\u5728\u65f6\u95f4\u6b65&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>t<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\u83b7\u53d6\u7684\u5956\u52b1\uff0c&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b3<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\u662f\u6298\u6263\u56e0\u5b50\uff0c<\/span><\/span><sub data-pm-slice=\"0 0 []\"><span><img alt=\"image.png\" class=\"rich_pages wxw-img\" data-ratio=\"0.19382022471910113\" 
data-type=\"png\" data-w=\"712\" style=\"vertical-align: baseline;width: 120px\" width=\"120\" data-width=\"120px\" data-imgfileid=\"100235325\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-4e0a801f1dfbbd1cfcf3ef27034c7fdb.png\" \/><img class=\"rich_pages wxw-img\" \/><img class=\"rich_pages wxw-img\" \/><img class=\"rich_pages wxw-img\" \/><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u662f\u5728\u65f6\u95f4\u6b65&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>t<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>+<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>1<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\u4e0b\uff0c\u901a\u8fc7\u76ee\u6807\u7f51\u7edc&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b8<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel76quw153m\" data-pm-slice=\"0 0 []\"><span><span>\u2212<\/span><\/span><\/sup><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\u8ba1\u7b97\u7684\u6700\u5927 Q \u503c\uff0c\u9009\u62e9\u4e0b\u4e00\u4e2a\u72b6\u6001&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\u4e2d\u7684\u6700\u4f73\u52a8\u4f5c\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 24px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm11wh\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Double DQN\u76ee\u6807 Q \u503c\u8ba1\u7b97\u516c\u5f0f\u6539\u4e3a\uff1a<\/span><\/span><\/p>\n<section style=\"text-align: center\"><img class=\"rich_pages wxw-img\" data-ratio=\"0.08518518518518518\" data-s=\"300,640\" data-type=\"png\" data-w=\"1080\" style=\"width:328px;height:28px\" data-imgfileid=\"100235326\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-527050ae0ab6169a0511ef2017f17010.png\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 16px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm11wh\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u52a8\u4f5c\u9009\u62e9\uff1a\u4f9d\u7136\u901a\u8fc7\u5f53\u524d Q \u7f51\u7edc&nbsp;<\/span><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 
0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b8<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\u6765\u9009\u62e9\u4e0b\u4e00\u4e2a\u72b6\u6001&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\u4e2d\u7684\u6700\u4f18\u52a8\u4f5c\uff0c<\/span><\/span><sub data-pm-slice=\"0 0 []\"><span><img alt=\"image.png\" class=\"rich_pages wxw-img\" data-ratio=\"0.14323607427055704\" data-type=\"png\" data-w=\"754\" style=\"vertical-align: baseline;width: 164px\" width=\"164\" data-width=\"164px\" data-imgfileid=\"100235327\" 
src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-88cf7a212b57497f76b8cc687a9ab308.png\" \/><img class=\"rich_pages wxw-img\" \/><img class=\"rich_pages wxw-img\" \/><img class=\"rich_pages wxw-img\" \/><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u8fd9\u4e2a\u6b65\u9aa4\u4f7f\u7528\u7684\u662f\u5f53\u524d\u7f51\u7edc&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b8<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\u6765\u9009\u62e9\u52a8\u4f5c\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm5fy\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u52a8\u4f5c\u8bc4\u4f30\uff1a\u8bc4\u4f30\u8fd9\u4e2a\u52a8\u4f5c\u7684 Q \u503c\u65f6\uff0c\u4f7f\u7528\u7684\u662f\u76ee\u6807\u7f51\u7edc&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b8<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel78y4a6b6\" data-pm-slice=\"0 0 []\"><span><span>\u2212<\/span><\/span><\/sup><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u5373\u8bc4\u4f30\u9009\u4e2d\u7684\u52a8\u4f5c&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel79g6b1ee1\" data-pm-slice=\"0 0 []\"><span><span>\u2217<\/span><\/span><\/sup><span style=\", 
Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>&nbsp;\u5bf9\u5e94\u7684 Q \u503c\uff1a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>+<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel79inqy3n\" data-pm-slice=\"0 0 []\"><span><span>\u2217<\/span><\/span><\/sup><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u03b8<\/span><\/span><sup style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel798xfpqu\" data-pm-slice=\"0 0 []\"><span><span>\u2212<\/span><\/span><\/sup><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: 
<span>\uff0c">
normal;font-weight: normal\"><span>\u3002\u901a\u8fc7\u8fd9\u79cd\u65b9\u5f0f\uff0cDouble DQN \u5c06\u52a8\u4f5c\u9009\u62e9\u548c\u52a8\u4f5c\u8bc4\u4f30\u5206\u5f00\uff0c\u907f\u514d\u4e86\u7ecf\u5178 DQN \u4e2d\u540c\u4e00\u7f51\u7edc\u540c\u65f6\u6267\u884c\u9009\u62e9\u548c\u8bc4\u4f30\u7684\u64cd\u4f5c\uff0c\u4ece\u800c\u51cf\u5c11\u4e86\u56e0\u9009\u62e9\u6700\u5927 Q \u503c\u800c\u5bfc\u81f4\u7684\u8fc7\u9ad8\u4f30\u8ba1\u504f\u5dee\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1uua\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmke9\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">5.1.2 Double DQN\u7684\u4f18\u52bf<\/span><\/span><\/span><\/h4>\n<p><span><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmq5r\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4f20\u7edf DQN \u5728\u66f4\u65b0\u65f6\uff0c\u76f4\u63a5\u7528\u76ee\u6807\u7f51\u7edc\u4f30\u8ba1\u7684\u6700\u5927 Q \u503c\u4f5c\u4e3a\u76ee\u6807\uff0c\u8fd9\u79cd\u201c\u6700\u5927\u5316\u201d\u64cd\u4f5c\u5bb9\u6613\u4ece\u566a\u58f0\u4e2d\u6311\u9009\u51fa\u504f\u5927\u503c\uff0c\u5bfc\u81f4\u6574\u4f53\u504f\u9ad8\u3002Double DQN
\u5219\u5148\u7528\u5f53\u524d\u7f51\u7edc\u6311\u9009\u52a8\u4f5c\uff0c\u518d\u7528\u76ee\u6807\u7f51\u7edc\u8ba1\u7b97\u4ef7\u503c\uff0c\u907f\u514d\u4e86\u5355\u4e00\u7f51\u7edc\u540c\u65f6\u8d1f\u8d23\u9009\u52a8\u4f5c\u548c\u8bc4\u4f30\u52a8\u4f5c\u4ef7\u503c\u6240\u5e26\u6765\u7684\u504f\u5dee\u3002Double DQN \u662f\u4e00\u79cd\u7b80\u5355\u6709\u6548\u7684\u6539\u8fdb\u7b56\u7565\uff0c\u901a\u8fc7\u201c\u52a8\u4f5c\u9009\u62e9\u201d\u548c\u201c\u52a8\u4f5c\u8bc4\u4f30\u201d\u5206\u5f00\u4f30\u8ba1\uff0c\u663e\u8457\u7f13\u89e3\u4e86 Q \u503c\u8fc7\u9ad8\u4f30\u8ba1\u95ee\u9898\uff0c\u63d0\u9ad8\u4e86\u6df1\u5ea6\u5f3a\u5316\u5b66\u4e60\u7b97\u6cd5\u7684\u7a33\u5b9a\u6027\u548c\u6027\u80fd\uff0c\u5df2\u6210\u4e3a\u6df1\u5ea6\u5f3a\u5316\u5b66\u4e60\u9886\u57df\u7684\u91cd\u8981\u65b9\u6cd5\u4e4b\u4e00\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1hrz\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1rak\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">5.2 Dueling DQN\uff1a\u5206\u79bb\u72b6\u6001\u4ef7\u503c\u4e0e\u4f18\u52bf\u51fd\u6570<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1rak\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm19wd\"><span style=\"font-size: 15px\"><span style=\", Arial, 
<span style=\"font-weight: bold\">5.2.1">
sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">5.2.1 Dueling DQN\u7684\u601d\u60f3<\/span><\/span><\/span><\/h4>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm19wd\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h4>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjmke9\"><span style=\"font-size: 15px\" data-pm-slice=\"2 3 [&quot;para&quot;,{&quot;tagName&quot;:&quot;h4&quot;,&quot;attributes&quot;:{&quot;style&quot;:&quot;margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center;&quot;,&quot;data-mpa-action-id&quot;:&quot;mel6pxjmke9&quot;},&quot;namespaceURI&quot;:&quot;http:\/\/www.w3.org\/1999\/xhtml&quot;}]\"><span><img loading=\"lazy\" class=\"rich_pages wxw-img\" data-ratio=\"0.5333333333333333\" data-type=\"png\" data-w=\"300\" height=\"160\" style=\"vertical-align: middle\" width=\"300\" data-imgfileid=\"100235175\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-9dc68ecfa688e4bc7c03e0cb1b354ba6.png\" \/><\/span><\/span><\/h4>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjm1kes\"><span style=\"font-size: 13px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-pm-slice=\"1 1 [&quot;para&quot;,{&quot;tagName&quot;:&quot;p&quot;,&quot;attributes&quot;:{&quot;style&quot;:&quot;margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;&quot;,&quot;data-mpa-action-id&quot;:&quot;mel6pxjm1kes&quot;},&quot;namespaceURI&quot;:&quot;http:\/\/www.w3.org\/1999\/xhtml&quot;}]\" data-mpa-action-id=\"mel7aqvuj8c\"><span>Dueling DQN
\u7f51\u7edc\u7ed3\u6784\u793a\u610f\u56fe<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1us5\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1us5\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Dueling DQN\uff08Dueling Deep Q-Network\uff09\u662f\u5bf9\u7ecf\u5178 DQN \u7684\u4e00\u79cd\u7ed3\u6784\u6027\u6539\u8fdb\uff0c\u65e8\u5728\u63d0\u5347\u667a\u80fd\u4f53\u5728\u590d\u6742\u73af\u5883\u4e2d\u7684\u5b66\u4e60\u6548\u7387\u548c\u7a33\u5b9a\u6027<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[5]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmo6t\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: justify\" data-mpa-action-id=\"mel6pxjmo6t\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span><span>\u5728\u4f20\u7edf\u7684 DQN \u4e2d\uff0cQ \u503c\u51fd\u6570 Q(s,a)
\u76f4\u63a5\u8f93\u51fa\u6bcf\u4e2a\u52a8\u4f5c\u7684\u4ef7\u503c\u3002\u7136\u800c\uff0c\u5728\u8bb8\u591a\u60c5\u51b5\u4e0b\uff0c\u67d0\u4e9b\u72b6\u6001\u4e0b\u7684\u6240\u6709\u52a8\u4f5c\u7684\u4ef7\u503c\u5dee\u5f02\u8f83\u5c0f\uff0c\u5bfc\u81f4\u5b66\u4e60\u8fc7\u7a0b\u4e2d\u7684\u68af\u5ea6\u66f4\u65b0\u6548\u7387\u4f4e\u4e0b\u3002Dueling DQN \u901a\u8fc7\u5c06 Q \u503c\u51fd\u6570\u5206\u89e3\u4e3a\u72b6\u6001\u4ef7\u503c\u51fd\u6570 V(s) \u548c\u4f18\u52bf\u51fd\u6570 A(s,a)\uff0c\u4f7f\u5f97\u7f51\u7edc\u80fd\u591f\u5206\u522b\u8bc4\u4f30\u72b6\u6001\u7684\u603b\u4f53\u4ef7\u503c\u548c\u5404\u4e2a\u52a8\u4f5c\u7684\u76f8\u5bf9\u4f18\u52bf\uff0c\u4ece\u800c\u63d0\u9ad8\u5b66\u4e60\u6548\u7387<\/span><\/span><span style=\"font-size: 15px\"><span>\u3002\u5177\u4f53\u5730\uff0cDueling DQN \u7684 Q \u503c\u8ba1\u7b97\u516c\u5f0f\u4e3a\uff1a<\/span><\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: justify\" data-mpa-action-id=\"mel6pxjmo6t\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 15px\"><span><br \/><\/span><\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjmo6t\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 15px\"><span>&nbsp;<\/span><\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 
15px\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>=V(s)+A<\/span><\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px\"><span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px\"><span>)<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: justify\" data-mpa-action-id=\"mel6pxjmo6t\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: justify\" data-mpa-action-id=\"mel6pxjmo6t\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px\">\u5176\u4e2d\uff0cV(s) \u662f\u72b6\u6001s\u7684\u4ef7\u503c\uff0c\u8868\u793a\u5728\u8be5\u72b6\u6001\u4e0b\u667a\u80fd\u4f53\u7684\u671f\u671b\u56de\u62a5\uff1bA(s,a) \u662f\u52a8\u4f5ca\u76f8\u5bf9\u4e8e\u5f53\u524d\u72b6\u6001\u7684\u4f18\u52bf\uff0c\u8868\u793a\u5728\u8be5\u72b6\u6001\u4e0b\u91c7\u53d6\u52a8\u4f5ca\u76f8\u5bf9\u4e8e\u5176\u4ed6\u52a8\u4f5c\u7684\u4f18\u52bf\u7a0b\u5ea6\u3002<\/span><\/p>\n<p style=\"margin-left: 
8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: justify\" data-mpa-action-id=\"mel6pxjmo6t\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: justify\" data-mpa-action-id=\"mel6pxjmo6t\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px\"><span>Dueling DQN \u7684\u7f51\u7edc\u7ed3\u6784\u5728\u4f20\u7edf DQN \u7684\u57fa\u7840\u4e0a\u8fdb\u884c\u4e86\u4fee\u6539\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: justify\" data-mpa-action-id=\"mel6pxjmo6t\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1zu8\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5177\u4f53\u800c\u8a00\uff0c\u7f51\u7edc\u7684\u524d\u51e0\u5c42\u5171\u4eab\uff0c\u7528\u4e8e\u63d0\u53d6\u8f93\u5165\u72b6\u6001\u7684\u7279\u5f81\uff1b\u7136\u540e\uff0c\u7f51\u7edc\u5206\u4e3a\u4e24\u4e2a\u5206\u652f\uff1a\u4e00\u4e2a\u7528\u4e8e\u8ba1\u7b97\u72b6\u6001\u4ef7\u503c\u51fd\u6570V(s)\uff0c\u53e6\u4e00\u4e2a\u7528\u4e8e\u8ba1\u7b97\u4f18\u52bf\u51fd\u6570 A(s,a)\u3002\u6700\u540e\uff0c\u4e24\u4e2a\u5206\u652f\u7684\u8f93\u51fa\u88ab\u5408\u5e76\uff0c\u5f97\u5230\u6bcf\u4e2a\u52a8\u4f5c\u7684 Q \u503c\u4f30\u8ba1\u3002\u8fd9\u79cd\u7ed3\u6784\u4f7f\u5f97\u7f51\u7edc\u80fd\u591f\u66f4\u6709\u6548\u5730\u5b66\u4e60\u5230\u72b6\u6001\u7684\u4ef7\u503c\u548c\u52a8\u4f5c\u7684\u4f18\u52bf\uff0c\u4ece\u800c\u63d0\u9ad8\u5b66\u4e60\u6027\u80fd\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1tix\"><span 
style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1zwl\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">5.1.2 Dueling DQN\u7684\u4f18\u52bf<\/span><\/span><\/span><\/h4>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1zwl\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h4>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmimb\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff081\uff09\u63d0\u9ad8\u5b66\u4e60\u6548\u7387\uff1a\u901a\u8fc7\u5206\u79bb\u72b6\u6001\u4ef7\u503c\u548c\u52a8\u4f5c\u4f18\u52bf\uff0cDueling DQN \u80fd\u591f\u66f4\u597d\u5730\u805a\u7126\u4e8e\u91cd\u8981\u4fe1\u606f\uff0c\u51cf\u5c11\u65e0\u5173\u56e0\u7d20\u5e72\u6270\uff0c\u63d0\u9ad8\u5b66\u4e60\u6548\u7387\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmimb\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm236f\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\uff082\uff09\u589e\u5f3a\u9c81\u68d2\u6027\uff1a\u5bf9\u72b6\u6001\u4ef7\u503c\u548c\u4f18\u52bf\u7684\u72ec\u7acb\u5efa\u6a21\u6709\u52a9\u4e8e\u7f13\u89e3\u73af\u5883\u566a\u58f0\u548c\u7a00\u758f\u5956\u52b1\u5e26\u6765\u7684\u5f71\u54cd\uff0c\u63d0\u9ad8\u7b97\u6cd5\u7684\u9c81\u68d2\u6027\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm236f\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1ryh\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff083\uff09\u63d0\u5347\u6cdb\u5316\u80fd\u529b\uff1aDueling \u67b6\u6784\u5141\u8bb8\u7f51\u7edc\u5728\u672a\u89c1\u8fc7\u7684\u73af\u5883\u4e2d\u66f4\u5feb\u5730\u63a8\u65ad\u51fa\u5408\u7406\u7684 Q \u503c\uff0c\u589e\u5f3a\u4e86\u7b97\u6cd5\u7684\u6cdb\u5316\u80fd\u529b\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmp9f\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm148x\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">5.3 DRQN<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm148x\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br 
\/><\/span><\/span><\/h3>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1ckz\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">5.3.1 DRQN\u7684\u601d\u60f3<\/span><\/span><\/span><\/h4>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1ckz\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h4>\n<section style=\"font-size: 17px;, Arial, sans-serif;line-height: 1.75em;letter-spacing: 0.034em;font-style: normal;font-weight: normal;margin-left: 8px;margin-right: 8px;margin-bottom: 0px;text-align: center\" data-mpa-action-id=\"mel6pxjmm5r\"><img loading=\"lazy\" class=\"rich_pages wxw-img\" data-ratio=\"0.99\" data-type=\"png\" data-w=\"300\" height=\"297\" style=\"vertical-align: middle\" width=\"300\" data-imgfileid=\"100235176\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-29591863afd8db0ca12a0aea09c288a2.png\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjm1x93\"><span style=\"font-size: 13px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel7fcjxmo1\" data-pm-slice=\"0 0 []\"><span>DRQN\u67b6\u6784<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1say\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1say\"><span 
style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"color: #3f3f3f;font-size: 15px\"><span>Deep Recurrent Q-Network\uff08DRQN\uff09\u662f\u5bf9\u7ecf\u5178 DQN \u7684\u4e00\u79cd\u6269\u5c55\uff0c\u65e8\u5728\u89e3\u51b3\u90e8\u5206\u53ef\u89c2\u5bdf\u9a6c\u5c14\u53ef\u592b\u51b3\u7b56\u8fc7\u7a0b\uff08POMDP\uff09\u4e2d\u7684\u6311\u6218<\/span><\/span><\/span><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[6]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3002\u5728 POMDP \u4e2d\uff0c\u667a\u80fd\u4f53\u65e0\u6cd5\u83b7\u5f97\u5b8c\u6574\u7684\u73af\u5883\u72b6\u6001\u4fe1\u606f\uff0c\u4f20\u7edf\u7684 DQN \u4f9d\u8d56\u4e8e\u5b8c\u6574\u7684\u89c2\u5bdf\u5e8f\u5217\u8fdb\u884c\u51b3\u7b56\uff0c\u53ef\u80fd\u5bfc\u81f4\u6027\u80fd\u4e0b\u964d\u3002DRQN \u901a\u8fc7\u5f15\u5165\u9012\u5f52\u795e\u7ecf\u7f51\u7edc\uff08RNN\uff09\uff0c\u7279\u522b\u662f\u957f\u77ed\u671f\u8bb0\u5fc6\uff08LSTM\uff09\u7f51\u7edc\uff0c\u4f7f\u667a\u80fd\u4f53\u80fd\u591f\u5904\u7406\u90e8\u5206\u89c2\u5bdf\u4fe1\u606f\uff0c\u4fdd\u7559\u5386\u53f2\u4fe1\u606f\uff0c\u4ece\u800c\u5728\u90e8\u5206\u53ef\u89c2\u5bdf\u7684\u73af\u5883\u4e2d\u8868\u73b0\u51fa\u66f4\u597d\u7684\u6027\u80fd\u3002DRQN \u7684\u6838\u5fc3\u601d\u60f3\u662f\u5c06\u4f20\u7edf DQN \u7684\u5168\u8fde\u63a5\u5c42\u66ff\u6362\u4e3a LSTM \u5c42\uff0c\u4ee5\u4fbf\u5728\u6bcf\u4e2a\u65f6\u95f4\u6b65\u90fd\u80fd\u4fdd\u7559\u5386\u53f2\u4fe1\u606f\u3002\u5177\u4f53\u800c\u8a00\uff0cDRQN \u7684 Q \u503c\u8ba1\u7b97\u516c\u5f0f\u4e3a\uff1a<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1say\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 
0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjm1say\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Q<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>s<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\" data-mpa-action-id=\"mel7grlaet8\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>a<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\" data-mpa-action-id=\"mel7gtimyb3\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>=<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>LSTM<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal;font-size: 15px\"><span>h<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span><span>\u2212<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><sub><span>1<\/span><\/sub><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>[<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>\u03d5<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>s<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\" data-mpa-action-id=\"mel7h6bl1i5u\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>)<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>a<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\" data-mpa-action-id=\"mel7h8dfm61\" data-pm-slice=\"0 0 
[]\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>)<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1say\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1say\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>\u5176\u4e2d\uff0ch<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><sub><span>t<\/span><\/sub><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span><span>\u2212<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><sub><span>1<\/span><\/sub><span><span>\u662f\u4e0a\u4e00\u65f6\u95f4\u6b65\u7684\u9690\u85cf\u72b6\u6001\uff0c\u03d5<\/span><\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>(<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>s<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\" data-mpa-action-id=\"mel7hcj723d7\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span 
style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal;font-size: 15px\"><span>)<\/span>\u662f\u5f53\u524d\u72b6\u6001\u7684\u7279\u5f81\u8868\u793a\uff0c<span>a<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel7hesn202j\" data-pm-slice=\"0 0 []\"><sub><span>t<\/span><\/sub><span><span>\u662f\u5f53\u524d\u52a8\u4f5c\u3002\u901a\u8fc7\u8fd9\u79cd\u65b9\u5f0f\uff0cDRQN \u80fd\u591f\u5728\u6bcf\u4e2a\u65f6\u95f4\u6b65\u90fd\u8003\u8651\u5230\u5386\u53f2\u4fe1\u606f\uff0c\u4ece\u800c\u66f4\u597d\u5730\u5e94\u5bf9\u90e8\u5206\u53ef\u89c2\u5bdf\u7684\u73af\u5883\u3002<\/span><\/span><\/span><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1say\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 8px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1say\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>DRQN \u7684\u7f51\u7edc\u7ed3\u6784\u901a\u5e38\u5305\u62ec\u4ee5\u4e0b\u51e0\u4e2a\u90e8\u5206\uff1a<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 8px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmvbe\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff081\uff09\u5377\u79ef\u5c42\uff08Convolutional Layers\uff09\uff1a\u7528\u4e8e\u4ece\u8f93\u5165\u56fe\u50cf\u4e2d\u63d0\u53d6\u7279\u5f81\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 8px;line-height: 1.75em\" 
data-mpa-action-id=\"mel6pxjmip6\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff082\uff09LSTM \u5c42\uff1a\u7528\u4e8e\u5904\u7406\u65f6\u95f4\u5e8f\u5217\u6570\u636e\uff0c<\/span>\u4fdd\u7559\u5386\u53f2\u4fe1\u606f\u3002<\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1hls\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff083\uff09\u5168\u8fde\u63a5\u5c42\uff08Fully Connected Layer\uff09\uff1a\u7528\u4e8e\u8f93\u51fa\u6bcf\u4e2a\u52a8\u4f5c\u7684 Q \u503c\u3002 \u8fd9\u79cd\u7ed3\u6784\u4f7f\u5f97 DRQN \u80fd\u591f\u5728\u6bcf\u4e2a\u65f6\u95f4\u6b65\u90fd\u8003\u8651\u5230\u5386\u53f2\u4fe1\u606f\uff0c\u4ece\u800c\u66f4\u597d\u5730\u5e94\u5bf9\u90e8\u5206\u53ef\u89c2\u5bdf\u7684\u73af\u5883\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1b95\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm93u\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">5.3.2 DRQN\u7684\u4f18\u52bf\u4e0e\u5c40\u9650<\/span><\/span><\/span><\/h4>\n<h4 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm93u\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h4>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 8px;line-height: 1.75em\" 
data-mpa-action-id=\"mel6pxjm12ti\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>1.\u4f18\u52bf<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 8px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmpcq\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff081\uff09\u5904\u7406\u90e8\u5206\u53ef\u89c2\u5bdf\u73af\u5883\uff1aDRQN \u80fd\u591f\u5728\u6bcf\u4e2a\u65f6\u95f4\u6b65\u90fd\u4fdd\u7559\u5386\u53f2\u4fe1\u606f\uff0c\u4ece\u800c\u5728\u90e8\u5206\u53ef\u89c2\u5bdf\u7684\u73af\u5883\u4e2d\u8868\u73b0\u51fa\u66f4\u597d\u7684\u6027\u80fd\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 8px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm7du\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff082\uff09\u63d0\u9ad8\u51b3\u7b56\u8d28\u91cf\uff1a\u901a\u8fc7\u5f15\u5165 LSTM \u5c42\uff0cDRQN \u80fd\u591f\u66f4\u597d\u5730\u6355\u6349\u65f6\u95f4\u5e8f\u5217\u4e2d\u7684\u957f\u671f\u4f9d\u8d56\u5173\u7cfb\uff0c\u4ece\u800c\u63d0\u9ad8\u51b3\u7b56\u8d28\u91cf\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmqik\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff083\uff09\u9002\u5e94\u6027\u5f3a\uff1aDRQN \u53ef\u4ee5\u9002\u5e94\u4e0d\u540c\u7684\u73af\u5883\u548c\u4efb\u52a1\uff0c\u5177\u6709\u8f83\u5f3a\u7684\u6cdb\u5316\u80fd\u529b\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 8px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1ob0\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: 
normal;font-weight: normal\"><span>2.\u5c40\u9650<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 8px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm236v\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff081\uff09\u8bad\u7ec3\u96be\u5ea6\uff1a\u7531\u4e8e\u5f15\u5165\u4e86 LSTM \u5c42\uff0cDRQN \u7684\u8bad\u7ec3\u8fc7\u7a0b\u53ef\u80fd\u6bd4\u4f20\u7edf DQN \u66f4\u52a0\u590d\u6742\u548c\u56f0\u96be\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 8px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjml9o\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff082\uff09\u8ba1\u7b97\u8d44\u6e90\u9700\u6c42\u9ad8\uff1aLSTM \u5c42\u7684\u5f15\u5165\u589e\u52a0\u4e86\u8ba1\u7b97\u91cf\uff0c\u5bf9\u786c\u4ef6\u8d44\u6e90\u7684\u8981\u6c42\u66f4\u9ad8\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmbry\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff083\uff09\u8d85\u53c2\u6570\u8c03\u4f18\u590d\u6742\uff1aLSTM \u5c42\u5f15\u5165\u4e86\u66f4\u591a\u7684\u8d85\u53c2\u6570\uff0c\u9700\u8981\u8fdb\u884c\u7cbe\u7ec6\u7684\u8c03\u4f18\u3002<\/span><\/span><\/p>\n<h2 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmmw2\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h2>\n<h2 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmmw2\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><br \/><\/span><\/span><\/h2>\n<h3 style=\", Arial, sans-serif;letter-spacing: 0.544px\">\n<section style=\"letter-spacing: 0.544px;text-align: right;font-size: 13px\">\n<section style=\"margin-top: 10px;margin-bottom: 10px;letter-spacing: 0.544px;text-align: center\">\n<section style=\"vertical-align: middle\">\n<section style=\"margin-bottom: -2px;, Arial, sans-serif\">\n<section style=\"float: left;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"float: right;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"clear: both;line-height: 0\">\n<section style=\"line-height: 0;width: 0px\"><\/section>\n<\/section>\n<\/section>\n<section style=\"padding-right: 10px;padding-left: 10px;font-size: 16px;line-height: 1.4\">\n<p><strong><strong style=\"text-align: left;letter-spacing: 0.544px\"><span style=\", Arial, sans-serif\"><strong style=\"letter-spacing: 0.578px\"><span>6. DQN \u7684\u5e94\u7528\u9886\u57df<\/span><\/strong><\/span><\/strong><\/strong><\/p>\n<\/section>\n<section style=\"margin-top: -2px;, Arial, sans-serif\">\n<section style=\"float: left;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"float: right;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/h3>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;letter-spacing: 0.578px;line-height: 1.75em\"><span><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: justify\" data-mpa-action-id=\"mel6pxjm1f5z\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">6.1 Atari \u6e38\u620f\u4e2d\u7684\u5e94\u7528\u4e0e\u8868\u73b0<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 
8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: justify\" data-mpa-action-id=\"mel6pxjm1f5z\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: justify\" data-mpa-action-id=\"mel6pxjm1f5z\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[1]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u7684\u4f5c\u8005\u5728 49 \u6b3e Atari \u6e38\u620f\u4e0a\u8fdb\u884c\u6d4b\u8bd5\uff0c\u5927\u591a\u6570\u8fbe\u5230\u4e86\u4eba\u7c7b\u6c34\u5e73\uff0c\u5e76\u4e14\u6709 43 \u6b3e\u8fbe\u5230\u4e86 SOTA\uff08\u6700\u5148\u8fdb\u6c34\u5e73State-Of-The-Art\uff09\u3002\u56fe\u4e2d 100% \u548c 0% \u5206\u522b\u4ee3\u8868\u4eba\u7c7b\u6c34\u5e73\u548c\u968f\u673a\u7b56\u7565\u6c34\u5e73\u3002<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: justify\" data-mpa-action-id=\"mel6pxjm1f5z\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<section style=\"font-size: 17px;, Arial, sans-serif;line-height: 1.75em;letter-spacing: 0.034em;font-style: normal;font-weight: normal;margin-left: 8px;margin-right: 8px;margin-bottom: 0px;text-align: center\" data-mpa-action-id=\"mel6pxjmbcs\"><img loading=\"lazy\" class=\"rich_pages wxw-img\" data-ratio=\"1.2233333333333334\" data-type=\"png\" data-w=\"300\" height=\"367\" style=\"vertical-align: middle\" width=\"300\" data-imgfileid=\"100235185\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-a80ce743ee8cc8fb9c56dacdabd21ee3.png\" \/><\/section>\n<p 
style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel7k0cpgze\" data-pm-slice=\"0 0 []\"><span style=\"font-size: 15px;, Arial, sans-serif;background-color: transparent;letter-spacing: 0.034em\"><span style=\"font-size: 13px\"><span>\u6027\u80fd\u8868\u73b0\uff0c\u5f15\u81ea<\/span><\/span><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;background-color: transparent\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em\"><span style=\"font-size: 13px\"><span>[1]<\/span><\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1ugm\"><span><br \/><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">\u6027\u80fd\u8868\u73b0<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmiep\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 8px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjmiep\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>DQN\u572849\u6b3eAtari 2600\u6e38\u620f\u4e0a\u7684\u6d4b\u8bd5\u7ed3\u679c\u53c2\u89c1\u4e0a\u56fe\uff0c\u5f15\u81ea<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[1]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u3002\u5176\u5c55\u73b0\u4e86\u7a81\u7834\u6027\u6027\u80fd\u3002\u5728\u7edf<\/span>\u4e00\u7f51\u7edc\u67b6\u6784\u3001\u7b97\u6cd5\u548c\u8d85\u53c2\u6570\u7684\u524d\u63d0\u4e0b\uff0c\u4ec5\u4ee5\u539f\u59cb\u50cf\u7d20\u548c\u6e38\u620f\u5206\u6570\u4e3a\u8f93\u5165\uff0cDQN\u572843\u6b3e\u6e38\u620f\u4e2d\u8d85\u8d8a\u4e86\u6b64\u524d\u6240\u6709\u5f3a\u5316\u5b66\u4e60\u7b97\u6cd5\uff08\u5982\u7ebf\u6027\u51fd\u6570\u903c\u8fd1\u548cSARSA\uff09\u3002\u66f4\u663e\u8457\u7684\u662f\uff0c\u5176\u8868\u73b0\u8fbe\u5230\u4eba\u7c7b\u4e13\u4e1a\u73a9\u5bb6\u6c34\u5e73\u768475%\u4ee5\u4e0a\u7684\u6e38\u620f\u4e2d\u536029\u6b3e\uff08\u8d85\u8fc7\u603b\u6570\u534a\u6570\uff09\u3002\u5178\u578b\u6848\u4f8b\u5982\uff1a<\/span><\/span><\/p>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Breakout\u4e2d\uff0cDQN\u5f97\u5206\u8fbe401.2\uff08\u968f\u673a\u7b56\u7565\u4e3a1.7\uff0c\u4eba\u7c7b\u4e3a31.8\uff09\uff0c\u76f8\u5f53\u4e8e\u4eba\u7c7b\u6c34\u5e73\u76841327%\u3002\u5176\u6210\u529f\u6e90\u4e8e\u81ea\u4e3b\u5b66\u4f1a&#8221;\u6316\u96a7\u9053&#8221;\u7b56\u7565\uff1a\u4f18\u5148\u51fb\u788e\u4fa7\u8fb9\u7816\u5757\uff0c\u5f15\u5bfc\u7403\u4f53\u4ece\u540e\u65b9\u7834\u574f\u6574\u5217\u7816\u5757\u3002<\/span><\/span><\/span><\/li>\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Pong\u4ee518.9\u5206\uff08\u4eba\u7c7b9.3\u5206\uff09\u5b9e\u73b0132%\u7684\u4eba\u7c7b\u6c34\u5e73\uff0c\u52a8\u4f5c\u4ef7\u503c\u9884\u6d4b\u7cbe\u51c6\uff1b<\/span><\/span><\/span><\/li>\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Video 
Pinball\u66f4\u4ee542,684\u5206\uff08\u4eba\u7c7b17,298\u5206\uff09\u8fbe\u62102539%\u7684\u4eba\u7c7b\u6c34\u5e73\uff0c\u8bc1\u660e\u5bf9\u590d\u6742\u7269\u7406\u673a\u5236\u7684\u9ad8\u6548\u5229\u7528\u3002<\/span><\/span><\/span><\/li>\n<\/ul>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm15qk\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm15qk\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8bad\u7ec3\u8fc7\u7a0b\u7a33\u5b9a\u6027\u901a\u8fc7\u5e73\u5747\u6bcf\u5c40\u5f97\u5206\u548c\u9884\u6d4bQ\u503c\u66f2\u7ebf\u5f97\u5230\u9a8c\u8bc1\uff0c\u89c1\u56fe,<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm15qk\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<section style=\"font-size: 17px;, Arial, sans-serif;line-height: 1.75em;letter-spacing: 0.034em;font-style: normal;font-weight: normal;margin-left: 8px;margin-right: 8px;margin-bottom: 0px;text-align: center\" data-mpa-action-id=\"mel6pxjm1rnp\"><img loading=\"lazy\" class=\"rich_pages wxw-img\" data-ratio=\"0.6\" data-type=\"jpeg\" data-w=\"300\" height=\"180\" style=\"vertical-align: middle\" width=\"300\" data-imgfileid=\"100235187\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-5840ecaf775e06183be0b9c84733acbe.jpeg\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjm1vlm\"><span style=\"font-size: 15px\" data-mpa-action-id=\"mel7mdzk17k9\" data-pm-slice=\"0 0 []\"><span 
style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 13px\"><span>\u9884\u6d4bQ\u503c\u66f2\u7ebf\uff0c\u5f15\u81ea<\/span><\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 13px\"><span>[1]<\/span><\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1k6i\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e8c\u8005\u5747\u968f\u8bad\u7ec3\u7a33\u6b65\u4e0a\u5347\uff0c\u672a\u51fa\u73b0\u4f20\u7edfQ\u5b66\u4e60\u7684\u53d1\u6563\u73b0\u8c61\u3002\u5956\u52b1\u88c1\u526a\u7b56\u7565\uff08\u6b63\u5956\u52b1+1\uff0c\u8d1f\u5956\u52b1-1\uff09\u5219\u786e\u4fdd\u4e86\u4e0d\u540c\u6e38\u620f\u95f4\u5b66\u4e60\u7387\u7684\u4e00\u81f4\u6027\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1xct\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1htf\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">\u6cdb\u5316\u4e0e\u8868\u5f81\u80fd\u529b<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1htf\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" 
data-mpa-action-id=\"mel6pxjm1exq\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>DQN\u7684\u6838\u5fc3\u7a81\u7834\u5728\u4e8e\u5176\u4ece\u9ad8\u7ef4\u8f93\u5165\u4e2d\u5b66\u4e60\u901a\u7528\u8868\u5f81\u7684\u80fd\u529b\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjm1exq\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn172t\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u901a\u8fc7t-SNE\u964d\u7ef4\u53ef\u89c6\u5316\uff0cDQN\u7684\u6700\u7ec8\u9690\u85cf\u5c42\u8868\u5f81\u663e\u793a\uff1a<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn23i\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn23i\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u611f<\/span>\u77e5\u76f8\u4f3c\u72b6\u6001\uff08\u5982\u654c\u673a\u5bc6\u96c6\u6392\u5217\u7684\u5c4f\u5e55\uff09\u88ab\u6620\u5c04\u5230\u5d4c\u5165\u7a7a\u95f4\u7684\u76f8\u90bb\u4f4d\u7f6e\uff0c\u89c1\u56fe;<\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn23i\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<section style=\"font-size: 17px;, 
Arial, sans-serif;line-height: 1.75em;letter-spacing: 0.034em;font-style: normal;font-weight: normal;margin-left: 8px;margin-right: 8px;margin-bottom: 0px;text-align: center\" data-mpa-action-id=\"mel6pxjnjp6\"><img loading=\"lazy\" class=\"rich_pages wxw-img\" data-ratio=\"0.7466666666666667\" data-type=\"jpeg\" data-w=\"300\" height=\"224\" style=\"vertical-align: middle\" width=\"300\" data-imgfileid=\"100235186\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-7f87656e17890a5544535877b26e9294.jpeg\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjngki\"><span style=\"font-size: 15px\" data-mpa-action-id=\"mel7ndurkfu\" data-pm-slice=\"0 0 []\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 13px\"><span>\u4eba\u7c7b\u8868\u5f81\u5bf9\u6bd4\uff0c\u5f15\u81ea<\/span><\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 13px\"><span>[1]<\/span><\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn18l\"><span><br \/><\/span><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5956\u52b1\u7b49\u4ef7\u4f46\u611f\u77e5\u4e0d\u540c\u72b6\u6001\uff08\u5982\u6e38\u620f\u5c3e\u58f0\u9636\u6bb5\u7684\u63a9\u4f53\u573a\u666f\uff09\u540c\u6837\u88ab\u805a\u7c7b\u2014\u2014\u8fd9\u4e9b\u72b6\u6001\u56e0\u5373\u65f6\u5956\u52b1\u6f5c\u529b\u4f4e\u88ab\u8d4b\u4e88\u76f8\u4f3c\u4ef7\u503c\uff08V\u503c\uff09\uff0c\u8bc1\u660e\u7f51\u7edc\u8d85\u8d8a\u4e86\u8868\u5c42\u50cf\u7d20\u7279\u5f81\uff0c\u5b66\u4f1a\u4e86\u4e0e\u51b3\u7b56\u76f8\u5173\u7684\u62bd\u8c61\u7279\u5f81\u3002 
\u8fdb\u4e00\u6b65\u5b9e\u9a8c\u8868\u660e\uff0c\u8be5\u8868\u5f81\u53ef\u6cdb\u5316\u81f3\u4eba\u7c7b\u73a9\u5bb6\u4ea7\u751f\u7684\u72b6\u6001\uff1a\u5c06\u4eba\u7c7b30\u5206\u949f\u6e38\u620f\u6570\u636e\u8f93\u5165DQN\u7f51\u7edc\uff0c\u5176t-SNE\u5d4c\u5165\u4e0e\u667a\u80fd\u4f53\u81ea\u8eab2\u5c0f\u65f6\u6e38\u620f\u6570\u636e\u7684\u5d4c\u5165\u7ed3\u6784\u9ad8\u5ea6\u91cd\u53e0\uff0c\u8bc1\u660e\u8868\u5f81\u4e0d\u53d7\u7b56\u7565\u4f9d\u8d56\u6027\u7684\u9650\u5236\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn23a0\"><span><br \/><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4ef7\u503c\u51fd\u6570\u7684\u9884\u6d4b\u80fd\u529b\u901a\u8fc7\u5177\u4f53\u6848\u4f8b\u5f97\u5230\u9a8c\u8bc1\uff1a<\/span><\/span><\/span><\/p>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Breakout\u4e2d\uff0c\u5f53\u667a\u80fd\u4f53\u5373\u5c06\u201c\u6316\u901a\u201d\u7816\u5899\u65f6\uff0cQ\u503c\u8dc3\u5347\u81f323\uff0c\u9884\u793a\u540e\u7eed\u81ea\u52a8\u6e05\u5c4f\u7684\u9ad8\u6536\u76ca\uff1b<\/span><\/span><\/span><\/li>\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>Pong\u4e2d\uff0c\u82e5\u7403\u4f53\u63a5\u8fd1\u7403\u62cd\u65f6\u9009\u62e9\u201c\u5411\u4e0b\u201d\u52a8\u4f5c\uff0cQ\u503c\u5b9e\u65f6\u964d\u81f3-0.9\uff0c\u51c6\u786e\u53cd\u6620\u4e22\u5931\u7403\u4f53\u7684\u98ce\u9669\u3002<\/span><\/span><\/span><\/li>\n<\/ul>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnirf\"><span 
style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnirf\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8fd9\u4e9b\u7ed3\u679c\u8bc1\u660e\uff0cDQN\u901a\u8fc7\u7aef\u5230\u7aef\u8bad\u7ec3\u6784\u5efa\u7684\u8868\u5f81\u80fd\u540c\u65f6\u652f\u6301\u611f\u77e5\u6cdb\u5316\u4e0e\u957f\u671f\u4ef7\u503c\u63a8\u7406\u3002<\/span><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn17a4\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn17a4\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">6.2 \u673a\u5668\u4eba\u63a7\u5236\u4e0e\u8def\u5f84\u89c4\u5212<\/span><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnwly\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnwly\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u53c2\u8003\u7efc\u8ff0<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[7]<\/span><\/span><span 
style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8fd9\u4e9b\u65b9\u6cd5\u90fd\u662f\u4f7f\u7528DQN\u76f4\u63a5\u4ece\u539f\u59cb\u4f20\u611f\u5668\u6570\u636e\u6620\u5c04\u5230\u52a8\u4f5c\uff0c\u65e0\u9700\u4f9d\u8d56\u9884\u5148\u6784\u5efa\u7684\u73af\u5883\u6a21\u578b\u6216\u5148\u9a8c\u77e5\u8bc6\u3002<\/span><\/span><\/span><\/p>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8f93\u5165\u7c7b\u578b\uff1a\u5305\u62ecRGB\u56fe\u50cf\u3001\u6df1\u5ea6\u56fe\u50cf\u3001\u6fc0\u5149\u96f7\u8fbe\u70b9\u4e91\u7b49\uff0c\u7528\u4e8e\u611f\u77e5\u73af\u5883\u72b6\u6001\u3002<\/span><\/span><\/section>\n<\/li>\n<li>\n<section style=\"margin-bottom: 0px;line-height: 1.75em\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u8f93\u51fa\u52a8\u4f5c\uff1a\u79bb\u6563\u52a8\u4f5c\u7a7a\u95f4\uff08\u5982\u524d\u8fdb\u3001\u5de6\u8f6c\u3001\u53f3\u8f6c\uff09\uff0c\u9002\u7528\u4e8e\u5bfc\u822a\u548c\u907f\u969c\u4efb\u52a1\u3002<\/span><\/span><\/section>\n<\/li>\n<\/ul>\n<section style=\"margin-bottom: 0px\"><span><br \/><\/span><\/section>\n<section style=\"font-size: 17px;, Arial, sans-serif;line-height: 1.75em;letter-spacing: 0.034em;font-style: normal;font-weight: normal;margin-left: 8px;margin-right: 8px;margin-bottom: 0px\" data-mpa-action-id=\"mel6pxjn43k\"><img loading=\"lazy\" class=\"rich_pages wxw-img\" data-ratio=\"0.5233333333333333\" data-type=\"jpeg\" data-w=\"600\" height=\"314\" style=\"border:0px;vertical-align:middle;margin:0px;background-color:transparent;width:100%\" width=\"600\" data-backw=\"562\" data-backh=\"294\" data-imgfileid=\"100235188\" 
src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-85136c388dfa46e1642fd7a8d6dd06d9.jpeg\" \/><\/section>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1vp5\"><span><br \/><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">\u5178\u578b\u5e94\u7528\u6848\u4f8b<\/span><\/span><\/span><\/p>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5ba4\u5185\u5bfc\u822a\u4e0e\u907f\u969c\uff1aTai\u7b49\u4eba\uff082017\uff09<\/span>[8]<span>\uff1a\u4f7f\u7528\u6df1\u5ea6\u56fe\u50cf\u4f5c\u4e3a\u8f93\u5165\uff0c\u8bad\u7ec3\u8f6e\u5f0f\u673a\u5668\u4eba\u5728\u8d70\u5eca\u73af\u5883\u4e2d\u5b9e\u73b0\u65e0\u5730\u56fe\u5bfc\u822a\uff0c\u8f93\u51fa\u8fde\u7eed\u8f6c\u5411\u6307\u4ee4\u3002Zhang\u7b49\u4eba\uff082020\uff09<\/span>[9]<span>\uff1a\u901a\u8fc7\u7279\u5f81\u8fc1\u79fb\u7b56\u7565\uff0c\u5c06\u4eff\u771f\u73af\u5883\u8bad\u7ec3\u7684DQN\u6a21\u578b\u8fc1\u79fb\u81f3\u771f\u5b9e\u673a\u5668\u4eba\uff0c\u89e3\u51b3\u4eff\u771f\u5230\u73b0\u5b9e\uff08Sim-to-Real\uff09\u7684\u6cdb\u5316\u95ee\u9898\u3002Barron\u7b49\u4eba\uff082019\uff09<\/span>[10]<span>\uff1a\u57283D\u865a\u62df\u73af\u5883\u4e2d\uff0c\u91c7\u7528RGB\u56fe\u50cf\u8f93\u5165\u8bad\u7ec3\u673a\u5668\u4eba\uff0c\u5728\u590d\u6742\u81ea\u7136\u573a\u666f\u4e2d\u5b9e\u73b0\u4f18\u4e8e\u6df1\u5ea6\u8f93\u5165\u7684\u5bfc\u822a\u6027\u80fd\u3002<\/span><\/span><\/span><\/li>\n<\/ul>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn20qf\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br 
\/><\/span><\/p>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u672a\u77e5\u73af\u5883\u63a2\u7d22\uff1aHaora\u7b49\u4eba\uff082020\uff09[11]\uff1a\u63d0\u51fa\u81ea\u9002\u5e94\u5168\u5377\u79efQ\u7f51\u7edc\uff08AFCQN\uff09\uff0c\u7ed3\u5408\u5c40\u90e8\u5730\u56fe\u4fe1\u606f\uff0c\u663e\u8457\u964d\u4f4e\u672a\u77e5\u73af\u5883\u4e2d\u7684\u5bfc\u822a\u5931\u8d25\u7387\u3002<\/span><\/span><\/span><\/li>\n<\/ul>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnd7u\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<ul style=\"margin-left: 8px;margin-right: 8px\" class=\"list-paddingleft-1\">\n<li><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u65e0\u4eba\u673a\u63a7\u5236\uff1aKang\u7b49\u4eba\uff082019\uff09[12]\uff1a\u4ec5\u7528\u5355\u76ee\u89c6\u89c9\u8f93\u5165\uff0c\u8bad\u7ec3\u56db\u65cb\u7ffc\u65e0\u4eba\u673a\u5728\u771f\u5b9e\u73af\u5883\u4e2d\u5b9e\u73b0\u52a8\u6001\u907f\u969c\u3002<\/span><\/span><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><span style=\"font-size: 15px\"><\/span><\/li>\n<\/ul>\n<section style=\"margin-bottom: 0px\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;line-height: 1.6;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/section>\n<section style=\"margin-left: 8px;margin-right: 8px;line-height: 1.75em\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 
0.034em;font-style: normal;font-weight: normal\"><span>\u5f53\u7136\u4e5f\u5b58\u5728\u4e00\u4e9b\u5c40\u9650\u6027\uff0c\u6bd4\u5982DQN \u4ec5\u652f\u6301\u79bb\u6563\u52a8\u4f5c\uff0c\u65e0\u6cd5\u76f4\u63a5\u5e94\u7528\u4e8e\u8fde\u7eed\u63a7\u5236\uff08\u5982\u65e0\u4eba\u673a\u7cbe\u7ec6\u59ff\u6001\u8c03\u6574\uff09\uff0c\u9700\u4f9d\u8d56DDPG\u7b49\u7b97\u6cd5\u8865\u5145\u3002\u8bad\u7ec3\u9700\u5927\u91cf\u4ea4\u4e92\u6570\u636e\uff0c\u73b0\u5b9e\u573a\u666f\u4e2d\u6570\u636e\u91c7\u96c6\u6210\u672c\u9ad8\u3002\u7a00\u758f\u5956\u52b1\u73af\u5883\u4e0b\uff08\u5982\u76ee\u6807\u8ddd\u79bb\u8fdc\uff09\uff0c\u5b66\u4e60\u6548\u7387\u4e0b\u964d\u3002\u603b\u7684\u6765\u8bf4\uff0cDQN \u901a\u8fc7\u7aef\u5230\u7aef\u5b66\u4e60\u4e0e\u7ecf\u9a8c\u56de\u653e\u673a\u5236\uff0c\u5728\u79fb\u52a8\u673a\u5668\u4eba\u89c6\u89c9\u5bfc\u822a\u3001\u5ba4\u5185\u907f\u969c\u53ca\u65e0\u4eba\u673a\u63a7\u5236\u4e2d\u53d6\u5f97\u663e\u8457\u6210\u679c\u3002\u5176\u6838\u5fc3\u4ef7\u503c\u5728\u4e8e\u5904\u7406\u9ad8\u7ef4\u611f\u77e5\u6570\u636e\u7684\u80fd\u529b\u548c\u7b97\u6cd5\u7a33\u5b9a\u6027\uff0c\u4f46\u9700\u7ed3\u5408\u6539\u8fdb\u6280\u672f\uff08\u5982Double DQN\u3001Rainbow\uff09\u4ee5\u63d0\u5347\u6027\u80fd\u3002\u672a\u6765\u7814\u7a76\u9700\u89e3\u51b3\u8fde\u7eed\u52a8\u4f5c\u652f\u6301\u4e0e\u6837\u672c\u6548\u7387\u95ee\u9898\uff0c\u4ee5\u6269\u5927\u5e94\u7528\u573a\u666f\u3002<\/span><\/span><\/span><\/section>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1r8m\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">6.3 \u63a8\u8350\u7cfb\u7edf\u4e2d\u7684\u7b56\u7565\u4f18\u5316<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1r8m\"><span style=\"font-size: 15px\"><span style=\", Arial, 
sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn125o\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u6587\u7ae0<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[13]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4ecb\u7ecd\u4e86\u5f3a\u5316\u5b66\u4e60\u5728\u63a8\u8350\u7cfb\u7edf\u4e2d\u7684\u5e94\u7528\uff0c\u5177\u4f53\u601d\u8def\u6d41\u7a0b\u5982\u4e0b\u56fe\u6240\u793a\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn125o\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjn125o\"><span style=\"font-size: 15px\"><span><img loading=\"lazy\" class=\"rich_pages wxw-img\" data-ratio=\"0.492\" data-type=\"jpeg\" data-w=\"500\" height=\"246\" style=\"vertical-align: middle\" width=\"500\" data-imgfileid=\"100235143\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-9c18bc1056869ad3c982dc3bc0b26b0f.jpeg\" \/><img class=\"rich_pages wxw-img\" \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjn23j6\"><span style=\"font-size: 15px\" data-mpa-action-id=\"mel7qtwmyup\" data-pm-slice=\"0 0 []\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span 
style=\"font-size: 13px\"><span>\u57fa\u4e8e\u5f3a\u5316\u5b66\u4e60\u7684\u63a8\u8350\u7cfb\u7edf\uff0c\u5f15\u81ea<\/span><\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 13px\"><span>[13]<\/span><\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn23j6\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnv8j\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u5176\u4e2d\uff0c\u6df1\u5ea6Q\u7f51\u7edc\uff08DQN\uff09\u901a\u8fc7\u5efa\u6a21\u7528\u6237\u52a8\u6001\u504f\u597d\u548c\u957f\u671f\u4ef7\u503c\uff0c\u89e3\u51b3\u4e86\u4f20\u7edf\u63a8\u8350\u7cfb\u7edf\u9762\u4e34\u7684\u63a2\u7d22-\u5229\u7528\u56f0\u5883\u548c\u5ef6\u8fdf\u5956\u52b1\u4f18\u5316\u95ee\u9898\u3002\u5176\u6838\u5fc3\u601d\u60f3\u662f\u5c06\u63a8\u8350\u89c6\u4e3a\u5e8f\u5217\u51b3\u7b56\u8fc7\u7a0b\uff1a\u7528\u6237\u72b6\u6001&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel7reu5l8g\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e3a\u5386\u53f2\u4ea4\u4e92\u7279\u5f81\uff0c\u52a8\u4f5c&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sub style=\", Arial, 
sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel7r6n6ywi\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e3a\u5f85\u63a8\u8350\u7269\u54c1\uff0c\u5956\u52b1&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>r<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel7r4ek2yx\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e3a\u70b9\u51fb\/\u8f6c\u5316\u7b49\u53cd\u9988\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1sz5\"><span><br \/><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">\u95ee\u9898\u5efa\u6a21\u4e0e\u4f18\u52bf<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1sz5\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn197\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u52a8\u6001\u504f\u597d\u6355\u6349\uff08vs. 
\u9759\u6001\u534f\u540c\u8fc7\u6ee4\uff09\uff1a DQN\u901a\u8fc7\u65f6\u5e8f\u72b6\u6001\u8f6c\u79fb\uff08&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel7rx6lfbg\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u2192<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel7rzq815g\" data-pm-slice=\"0 0 []\"><sub><span>t+1<\/span><\/sub><span><span>\uff09\u5b9e\u65f6\u66f4\u65b0\u7528\u6237\u5174\u8da3\u8868\u5f81\uff0c\u514b\u670d\u534f\u540c\u8fc7\u6ee4\u7684\u9759\u6001\u5efa\u6a21\u5c40\u9650\u3002<\/span><\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn197\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel7rzq815g\" data-pm-slice=\"0 0 []\"><span><br \/><\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn13sg\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u957f\u671f\u4ef7\u503c\u4f18\u5316\uff08vs. 
\u5373\u65f6\u6536\u76ca\u6a21\u578b\uff09\uff1a\u6700\u5927\u5316\u7d2f\u8ba1\u5956\u52b1<\/span><\/span><sub data-pm-slice=\"0 0 []\"><span><img alt=\"image.png\" class=\"rich_pages wxw-img\" data-ratio=\"0.23636363636363636\" data-type=\"png\" data-w=\"660\" style=\"vertical-align: baseline;width: 84px\" width=\"84\" data-width=\"84px\" data-imgfileid=\"100235328\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-02f943761ca5d406a0b04c303b7be8b3.png\" \/><img class=\"rich_pages wxw-img\" \/><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff0c\u907f\u514d\u77ed\u89c6\u7b56\u7565\uff08\u5982\u4ec5\u63a8\u8350\u70ed\u95e8\u5546\u54c1\uff09\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn13sg\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1u8u\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u63a2\u7d22\u673a\u5236\uff1a\u03b5-greedy\u7b56\u7565\u4e3b\u52a8\u63a8\u8350\u4f4e\u66dd\u5149\u5546\u54c1\uff0c\u7f13\u89e3\u51b7\u542f\u52a8\u95ee\u9898\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1a2i\"><span><br \/><\/span><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">\u6280\u672f\u5b9e\u73b0\u67b6\u6784<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1a2i\"><span 
style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnte2\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u72b6\u6001\u8868\u5f81\uff1a\u7528\u6237\u753b\u50cf\uff08\u6027\u522b\/\u5e74\u9f84\uff09 + \u884c\u4e3a\u5e8f\u5217\uff08\u70b9\u51fb\/\u8d2d\u4e70\u5386\u53f2\uff09 \u2192 \u5d4c\u5165\u5c42 \u2192 LSTM\u7f16\u7801 \u2192 \u72b6\u6001\u5411\u91cf&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>s<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel7t2n1lz0\" data-pm-slice=\"0 0 []\"><span><span>t<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnjjq\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnjjq\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u52a8\u4f5c\u7a7a\u95f4\uff1a\u79bb\u6563\u5019\u9009\u7269\u54c1\u96c6&nbsp;<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\" data-mpa-action-id=\"mel7tcgw17dg\" data-pm-slice=\"0 0 []\"><span><span>1<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel7tefe1jxx\" data-pm-slice=\"0 0 []\"><span><span>2<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>.<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>.<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>.<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>,<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>a<\/span><\/span><sub style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\" data-mpa-action-id=\"mel7tgmxedn\" data-pm-slice=\"0 0 []\"><span><span>N<\/span><\/span><\/sub><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\uff08N=\u5343\u81f3\u767e\u4e07\u7ea7\uff09\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnjjq\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 
8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn18hw\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u7f51\u7edc\u7ed3\u6784\u5982\u4e0b\u56fe\u6240\u793a\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn18hw\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjn18hw\"><span><img loading=\"lazy\" class=\"rich_pages wxw-img\" data-ratio=\"0.778\" data-type=\"jpeg\" data-w=\"500\" height=\"389\" style=\"vertical-align: middle\" width=\"500\" data-imgfileid=\"100235144\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-362322ada05ae875b8d48f7686a95c95.jpeg\" \/><img class=\"rich_pages wxw-img\" \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjn7r1\"><span style=\"font-size: 15px\" data-mpa-action-id=\"mel7tsqc1vik\" data-pm-slice=\"0 0 []\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 13px\"><span>\u57fa\u4e8eDQN\u7684\u63a8\u8350\u7cfb\u7edf\u7b97\u6cd5\uff0c\u5f15\u81ea<\/span><\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-size: 13px\"><span>[13]<\/span><\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn21mr\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h2 style=\"margin-left: 8px;margin-right: 
8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnka6\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h2>\n<h3 style=\", Arial, sans-serif;letter-spacing: 0.544px\">\n<section style=\"letter-spacing: 0.544px;text-align: right;font-size: 13px\">\n<section style=\"margin-top: 10px;margin-bottom: 10px;letter-spacing: 0.544px;text-align: center\">\n<section style=\"vertical-align: middle\">\n<section style=\"margin-bottom: -2px;, Arial, sans-serif\">\n<section style=\"float: left;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"float: right;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"clear: both;line-height: 0\">\n<section style=\"line-height: 0;width: 0px\"><\/section>\n<\/section>\n<\/section>\n<section style=\"padding-right: 10px;padding-left: 10px;font-size: 16px;line-height: 1.4\">\n<p><strong><strong style=\"text-align: left;letter-spacing: 0.544px\"><span style=\", Arial, sans-serif\"><strong style=\"letter-spacing: 0.578px\"><span>7. 
DQN \u7684\u5c40\u9650\u6027\u4e0e\u6311\u6218<\/span><\/strong><\/span><\/strong><\/strong><\/p>\n<\/section>\n<section style=\"margin-top: -2px;, Arial, sans-serif\">\n<section style=\"float: left;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<section style=\"float: right;width: 8px;height: 3px;line-height: 0\"><span><br \/><\/span><\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/h3>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;letter-spacing: 0.578px;line-height: 1.75em\"><span><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1lc9\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">7.1 \u5bf9\u8fde\u7eed\u52a8\u4f5c\u7a7a\u95f4\u7684\u5904\u7406\u56f0\u96be<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1yjl\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnjgm\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>DQN \u4f5c\u4e3a\u4e00\u4e2a\u57fa\u4e8e\u79bb\u6563\u52a8\u4f5c\u7a7a\u95f4\u7684\u7b97\u6cd5\uff0c\u5728\u9762\u5bf9\u8fde\u7eed\u52a8\u4f5c\u7a7a\u95f4\u65f6\u8868\u73b0\u4e0d\u4f73\u3002\u4f20\u7edf\u7684 DQN \u5c06\u52a8\u4f5c\u7a7a\u95f4\u79bb\u6563\u5316\u4e3a\u6709\u9650\u7684\u51e0\u79cd\u9009\u62e9\uff0c\u5e76\u5bf9\u6bcf\u4e00\u4e2a\u52a8\u4f5c\u5206\u522b\u8fdb\u884c Q 
\u503c\u66f4\u65b0\u3002\u7136\u800c\uff0c\u5728\u5b9e\u9645\u5e94\u7528\u4e2d\uff0c\u8bb8\u591a\u4efb\u52a1\u8981\u6c42\u5728\u8fde\u7eed\u7684\u52a8\u4f5c\u7a7a\u95f4\u4e2d\u8fdb\u884c\u9009\u62e9\uff08\u5982\u673a\u5668\u4eba\u63a7\u5236\u3001\u81ea\u52a8\u9a7e\u9a76\u7b49\uff09\uff0c\u8fd9\u4f7f\u5f97 DQN \u96be\u4ee5\u76f4\u63a5\u5e94\u7528\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1qxw\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjndoj\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e3a\u4e86\u89e3\u51b3\u8fd9\u4e2a\u95ee\u9898\uff0c\u7814\u7a76\u8005\u4eec\u63d0\u51fa\u4e86\u5982\u6df1\u5ea6\u786e\u5b9a\u6027\u7b56\u7565\u68af\u5ea6\uff08DDPG\uff09<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[14]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u3001\u8f6f\u884c\u4e3a\u8005-\u8bc4\u8bba\u5bb6\uff08SAC\uff09\u7b49\u7b97\u6cd5\uff0c\u8fd9\u4e9b\u7b97\u6cd5\u4f7f\u7528\u8fde\u7eed\u7684\u7b56\u7565\u8f93\u51fa\uff0c\u5e76\u7ed3\u5408\u7b56\u7565\u68af\u5ea6\u65b9\u6cd5\u6765\u4f18\u5316\u8fde\u7eed\u52a8\u4f5c\u7a7a\u95f4\u4e2d\u7684\u51b3\u7b56\u8fc7\u7a0b\u3002\u7136\u800c\uff0cDQN \u5728\u5904\u7406\u8fde\u7eed\u52a8\u4f5c\u7a7a\u95f4\u65f6\u7684\u9002\u5e94\u6027\u4ecd\u7136\u662f\u4e00\u4e2a\u4e9f\u5f85\u89e3\u51b3\u7684\u96be\u9898\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1rpf\"><span style=\"font-size: 
17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn11t1\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">7.2 \u8bad\u7ec3\u8fc7\u7a0b\u4e2d\u7684\u6837\u672c\u6548\u7387\u95ee\u9898<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1fat\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1y95\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>DQN \u5728\u8bad\u7ec3\u8fc7\u7a0b\u4e2d\u9700\u8981\u5927\u91cf\u7684\u4e0e\u73af\u5883\u7684\u4ea4\u4e92\u6570\u636e\uff0c\u624d\u80fd\u6709\u6548\u5730\u5b66\u4e60\u5230\u6700\u4f18\u7b56\u7565\uff0c\u8fd9\u4f7f\u5f97\u6837\u672c\u6548\u7387\u4f4e\u4e0b\u3002\u4e3a\u4e86\u51cf\u5c11\u8bad\u7ec3\u65f6\u95f4\uff0cDQN \u5f15\u5165\u4e86\u7ecf\u9a8c\u56de\u653e\uff08Experience Replay\uff09\u673a\u5236\uff0c\u5c06\u5386\u53f2\u7ecf\u9a8c\u5b58\u50a8\u5728\u56de\u653e\u7f13\u51b2\u533a\uff0c\u5e76\u5728\u8bad\u7ec3\u8fc7\u7a0b\u4e2d\u968f\u673a\u62bd\u53d6\u6837\u672c\u8fdb\u884c\u5b66\u4e60\u3002\u867d\u7136\u8fd9\u79cd\u65b9\u6cd5\u80fd\u6709\u6548\u7f13\u89e3\u76f8\u5173\u6027\u5e26\u6765\u7684\u95ee\u9898\uff0c\u4f46\u5b83\u5e76\u4e0d\u80fd\u4ece\u6839\u672c\u4e0a\u89e3\u51b3\u6837\u672c\u6548\u7387\u95ee\u9898\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" 
data-mpa-action-id=\"mel6pxjn7uq\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1cs9\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4f4e\u6837\u672c\u6548\u7387\u4f7f\u5f97 DQN \u5728\u9700\u8981\u5feb\u901f\u53cd\u5e94\u6216\u4ea4\u4e92\u53d7\u9650\u7684\u73af\u5883\u4e2d\uff08\u5982\u73b0\u5b9e\u4e16\u754c\u4e2d\u7684\u673a\u5668\u4eba\u63a7\u5236\uff09\u8868\u73b0\u4e0d\u7406\u60f3\u3002\u6b64\u5916\uff0c\u8bad\u7ec3\u6570\u636e\u7684\u9ad8\u9700\u6c42\u589e\u52a0\u4e86\u8ba1\u7b97\u5f00\u9500\uff0c\u5e76\u4e14\u53ef\u80fd\u5bfc\u81f4\u7b97\u6cd5\u5728\u5b9e\u9645\u4efb\u52a1\u4e2d\u7684\u5e94\u7528\u4e0d\u591f\u7075\u6d3b\u3002\u6587\u7ae0<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[15]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u63d0\u51fa\u4e86Rainbow DQN\uff0c\u5c06\u591a\u79cd DQN \u7684\u6539\u8fdb\u6280\u672f\u878d\u5408\uff0c\u4ee5\u63d0\u9ad8 DQN \u7684\u7a33\u5b9a\u6027\u548c\u6837\u672c\u6548\u7387\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1c5t\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn150c\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">7.3 
\u7b56\u7565\u6536\u655b\u901f\u5ea6\u6162\u4e0e\u7a33\u5b9a\u6027\u95ee\u9898<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1myx\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1niw\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>DQN \u7684\u8bad\u7ec3\u8fc7\u7a0b\u901a\u5e38\u5b58\u5728\u6536\u655b\u901f\u5ea6\u6162\u548c\u8bad\u7ec3\u4e0d\u7a33\u5b9a\u7684\u95ee\u9898\u3002\u7531\u4e8e Q \u503c\u51fd\u6570\u662f\u901a\u8fc7\u795e\u7ecf\u7f51\u7edc\u903c\u8fd1\u7684\uff0c\u800c\u6df1\u5ea6\u795e\u7ecf\u7f51\u7edc\u672c\u8eab\u5bb9\u6613\u51fa\u73b0\u68af\u5ea6\u7206\u70b8\u3001\u68af\u5ea6\u6d88\u5931\u7b49\u95ee\u9898\uff0c\u8fd9\u4f1a\u5bfc\u81f4\u8bad\u7ec3\u8fc7\u7a0b\u4e2d\u7684\u4e0d\u7a33\u5b9a\u3002\u6b64\u5916\uff0cQ \u503c\u66f4\u65b0\u8fc7\u7a0b\u4e2d\u7684\u76ee\u6807\u503c\uff08\u5373\u6700\u5927\u5316\u7684 Q \u503c\uff09\u901a\u5e38\u4f1a\u53d1\u751f\u53d8\u5316\uff0c\u5bfc\u81f4\u76ee\u6807\u7f51\u7edc\u548c\u884c\u4e3a\u7f51\u7edc\u4e4b\u95f4\u7684\u4e0d\u4e00\u81f4\uff0c\u8fd9\u4f1a\u8fdb\u4e00\u6b65\u52a0\u5267\u8bad\u7ec3\u7684\u9707\u8361\u548c\u4e0d\u7a33\u5b9a\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn3wf\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1ful\"><span style=\"font-size: 15px\"><span style=\", Arial, 
sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4e3a\u4e86\u63d0\u9ad8\u7a33\u5b9a\u6027\uff0cDQN \u5f15\u5165\u4e86\u76ee\u6807\u7f51\u7edc\uff08Target Network\uff09\u548c\u7ecf\u9a8c\u56de\u653e\u673a\u5236\u3002\u76ee\u6807\u7f51\u7edc\u7684\u5f15\u5165\u4f7f\u5f97 Q \u503c\u7684\u66f4\u65b0\u76ee\u6807\u5728\u4e00\u5b9a\u65f6\u95f4\u5185\u4fdd\u6301\u4e0d\u53d8\uff0c\u4ece\u800c\u907f\u514d\u4e86\u76ee\u6807\u503c\u7684\u4e0d\u65ad\u53d8\u5316\u5bf9\u8bad\u7ec3\u8fc7\u7a0b\u7684\u5f71\u54cd\u3002\u6587\u7ae0<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>[16]<\/span><\/span><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>\u4ecb\u7ecd\u4e86 PPO \u7b97\u6cd5\uff0c\u89e3\u51b3\u4e86\u7b56\u7565\u4f18\u5316\u4e2d\u7a33\u5b9a\u6027\u5dee\u548c\u6536\u655b\u901f\u5ea6\u6162\u7684\u95ee\u9898\u3002\u7136\u800c\uff0c\u5c3d\u7ba1\u8fd9\u4e9b\u6280\u672f\u6539\u5584\u4e86\u7a33\u5b9a\u6027\uff0cDQN \u7684\u6536\u655b\u901f\u5ea6\u548c\u8bad\u7ec3\u8fc7\u7a0b\u7684\u7a33\u5b9a\u6027\u95ee\u9898\u4f9d\u7136\u5b58\u5728\uff0c\u7279\u522b\u662f\u5728\u590d\u6742\u7684\u73af\u5883\u4e2d\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn10wt\"><span style=\"font-size: 17px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<h3 style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnwg3\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span style=\"font-weight: bold\">7.4 \u6cdb\u5316\u80fd\u529b\u4e0e\u8fc7\u62df\u5408\u98ce\u9669<\/span><\/span><\/span><\/h3>\n<h3 style=\"margin-left: 8px;margin-right: 
8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnwg3\"><span style=\"font-size: 15px\"><span style=\", Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/span><\/h3>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn27w\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><span>DQN \u5728\u9762\u5bf9\u9ad8\u7ef4\u72b6\u6001\u7a7a\u95f4\u548c\u590d\u6742\u73af\u5883\u65f6\uff0c\u5bb9\u6613\u51fa\u73b0\u8fc7\u62df\u5408\u95ee\u9898\u3002\u5728\u8bad\u7ec3\u8fc7\u7a0b\u4e2d\uff0cDQN \u901a\u8fc7\u5bf9\u5927\u91cf\u7684\u73af\u5883\u4ea4\u4e92\u8fdb\u884c\u5b66\u4e60\u6765\u66f4\u65b0 Q \u503c\u51fd\u6570\u3002\u7136\u800c\uff0c\u5728\u6709\u9650\u7684\u8bad\u7ec3\u6570\u636e\u4e0a\uff0cDQN \u53ef\u80fd\u4f1a\u8fc7\u5ea6\u62df\u5408\u67d0\u4e9b\u7279\u5b9a\u7684\u72b6\u6001\u548c\u52a8\u4f5c\uff0c\u4ece\u800c\u5931\u53bb\u5bf9\u672a\u77e5\u73af\u5883\u6216\u672a\u89c1\u8fc7\u72b6\u6001\u7684\u9002\u5e94\u80fd\u529b\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjncvz\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1p9q\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: 
normal\"><span>\u8fd9\u79cd\u8fc7\u62df\u5408\u7684\u73b0\u8c61\u5728\u9ad8\u7ef4\u7a7a\u95f4\u6216\u591a\u53d8\u73af\u5883\u4e2d\u7279\u522b\u660e\u663e\uff0c\u667a\u80fd\u4f53\u7684\u6cdb\u5316\u80fd\u529b\u53d7\u5230\u9650\u5236\u3002\u5f53\u667a\u80fd\u4f53\u5728\u4e00\u4e2a\u6709\u9650\u7684\u8bad\u7ec3\u73af\u5883\u4e2d\u83b7\u5f97\u8bad\u7ec3\u540e\uff0c\u5176\u5b66\u5230\u7684\u7b56\u7565\u5728\u65b0\u7684\u6216\u7565\u5fae\u4e0d\u540c\u7684\u73af\u5883\u4e2d\u8868\u73b0\u8f83\u5dee\u3002\u4e3a\u4e86\u89e3\u51b3\u8fd9\u4e00\u95ee\u9898\uff0c\u7814\u7a76\u8005\u63d0\u51fa\u4e86\u66f4\u5148\u8fdb\u7684\u6280\u672f\uff0c\u5982\u6b63\u5219\u5316\u3001\u81ea\u52a8\u8c03\u6574\u7f51\u7edc\u7ed3\u6784\u7b49\u65b9\u6cd5\uff0c\u4ee5\u589e\u5f3a\u6a21\u578b\u7684\u6cdb\u5316\u80fd\u529b\uff0c\u4f46\u8fd9\u4e9b\u65b9\u6cd5\u4ecd\u672a\u80fd\u5b8c\u5168\u6d88\u9664 DQN \u5728\u590d\u6742\u73af\u5883\u4e2d\u9762\u4e34\u7684\u8fc7\u62df\u5408\u98ce\u9669\u3002<\/span><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1p9q\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1p9q\"><span><img class=\"rich_pages wxw-img js_insertlocalimg\" data-ratio=\"0.5625\" data-s=\"300,640\" data-type=\"jpeg\" data-w=\"1280\" style=\"width: 100%\" data-backw=\"562\" data-backh=\"316\" data-imgfileid=\"100235450\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-901a70777f62704ff69d1ffb6fab0074.jpeg\" \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1p9q\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"margin-left: 8px;margin-right: 
8px;margin-bottom: 0px;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1p9q\"><span style=\"font-size: 15px;, Arial, sans-serif;letter-spacing: 0.034em;font-style: normal;font-weight: normal\"><br \/><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span><br \/><\/span><\/span><\/p>\n<section style=\"margin: 0px;padding: 0px;max-width: 100%;font-family: PingFangSC-light;font-size: 15px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none\" data-pm-slice=\"0 0 []\">\n<section style=\"margin: 0px;padding: 0px 6px;max-width: 100%;width: 661px;vertical-align: top\">\n<section style=\"margin: 0px;padding: 0px;max-width: 100%;line-height: 1.4\">\n<p style=\"margin: 0px;padding: 0px;max-width: 100%;clear: both;min-height: 1em\"><strong style=\"margin: 0px;padding: 0px;max-width: 100%\"><span>\u53c2\u8003\u6587\u732e<\/span><\/strong><\/p>\n<\/section>\n<\/section>\n<\/section>\n<section style=\"margin: 0px;padding: 0px;max-width: 100%;font-family: PingFangSC-light;font-size: 15px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-indent: 0px;text-transform: none;text-align: center;width: 661px\">\n<section style=\"margin: 0px;padding: 0px 0px 0px 4px;max-width: 100%;width: 661px;height: 360px;vertical-align: top\">\n<section style=\"margin: 0px;padding: 0px;max-width: 100%\">\n<section style=\"margin: 0px;padding: 0px;max-width: 100%;text-align: justify;font-size: 13px\">\n<p style=\"margin: 0px;padding: 0px;max-width: 100%;clear: both;min-height: 1em\"><span><br \/><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\" data-pm-slice=\"3 3 []\"><span style=\"font-size: 13px\"><span>1. Mnih, V.; Kavukcuoglu, K. (2015). &#8220;Human-level control through deep reinforcement learning&#8221;. Nature. 518 (7540): 529\u2013533. 
doi:10.1038\/nature14236. PMID 25719670.<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>2. Overmars M G. Analyzing the convergence of Q-learning through Markov decision theory[D]. University of Twente, 2021.<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>3. Even-Dar E, Mansour Y. Convergence of optimistic and incremental Q-learning[J]. Advances in neural information processing systems, 2001, 14.<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>4. Van Hasselt H, Guez A, Silver D. Deep reinforcement learning with double q-learning[C]\/\/Proceedings of the AAAI conference on artificial intelligence. 2016, 30(1).<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>5. Wang Z, Schaul T, Hessel M, et al. Dueling network architectures for deep reinforcement learning[C]\/\/International conference on machine learning. PMLR, 2016: 1995-2003.<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>6. Hausknecht M J, Stone P. Deep Recurrent Q-Learning for Partially Observable MDPs[C]\/\/AAAI fall symposia. 2015, 45: 141.<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>7. Sun, Huihui; Zhang, Weijie; Yu, Runxiang; Zhang, Yujie (2021). &#8220;Motion planning for mobile robots\u2014Focusing on deep reinforcement learning: A systematic review&#8221;. IEEE Access. IEEE. 9: 69061\u201369081. 
doi:10.1109\/ACCESS.2021.3076530.<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>8. Tai, Lei; Paolo, Giuseppe; Liu, Ming (2017). &#8220;Virtual-to-real deep reinforcement learning: Continuous control of mobile robots for mapless navigation&#8221;. IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS). IEEE: 31\u201336. doi:10.1109\/IROS.2017.8202134.<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>9. Wang, Y.; Sun, J.; He, H.; Sun, C. (2020). &#8220;Deterministic policy gradient with integral compensator for robust quadrotor control&#8221;. IEEE Transactions on Systems, Man, and Cybernetics: Systems. IEEE. 50 (10): 3713\u20133725. doi:10.1109\/TSMC.2020.3002218.<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>10. Barron, T.; Whitehead, M.; Yeung, A. (2016). Deep reinforcement learning in a 3-D blockworld environment. IJCAI\/AAAI Press. pp. 1\u20136.<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>11. Li, H.; Zhang, Q.; Zhao, D. (2020). &#8220;Deep reinforcement learning-based automatic exploration for navigation in unknown environment&#8221;. IEEE Transactions on Neural Networks and Learning Systems. IEEE. 31 (6): 2064\u20132076. doi:10.1109\/TNNLS.2019.2930059.<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>12. Kang, Kyunghoon; Belkhale, Suneel; Kahn, Gregory; Abbeel, Pieter; Levine, Sergey (2019). 
&#8220;Generalization through simulation: Integrating simulated and real data into deep reinforcement learning for vision-based autonomous flight&#8221;. IEEE International Conference on Robotics and Automation (ICRA). IEEE: 6008\u20136014. doi:10.1109\/ICRA.2019.8793701.<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>13. Chen, Xiaocong; Yao, Lina; McAuley, Julian; Zhou, Guanglin; Wang, Xianzhi (2021). &#8220;A survey of deep reinforcement learning in recommender systems: A systematic review and future directions&#8221;. arXiv preprint: arXiv:2109.03540.<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>14. Lillicrap, T. P., Hunt, J. J., Pritzel, A., Heess, N., Erez, T., Tassa, Y., &#8230; &amp; Wierstra, D. (2015). Continuous control with deep reinforcement learning. arXiv preprint arXiv:1509.02971.<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>15. Hessel, M., Modayil, J., Van Hasselt, H., Schaul, T., Ostrovski, G., Dabney, W., &#8230; &amp; Silver, D. (2018, April). Rainbow: Combining improvements in deep reinforcement learning. In Proceedings of the AAAI conference on artificial intelligence (Vol. 32, No. 1).<\/span><\/span><\/p>\n<p style=\"text-align: left;margin-left: 8px;margin-right: 8px;line-height: 1.5em;margin-bottom: 8px\"><span style=\"font-size: 13px\"><span>16. Schulman, J., Wolski, F., Dhariwal, P., Radford, A., &amp; Klimov, O. (2017). Proximal policy optimization algorithms. 
arXiv preprint arXiv:1707.06347.<\/span><\/span><\/p>\n<p style=\"margin: 0px;padding: 0px;max-width: 100%;clear: both;min-height: 1em\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><span><br \/><\/span><\/span><\/p>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<section style=\"margin: 3px 0px 0px;padding: 0px;max-width: 100%;font-family: PingFangSC-light;font-size: 15px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none\">\n<section style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 14px;letter-spacing: 1px\">\n<p style=\"margin: 0px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;text-align: center\"><span>\u53c2\u8003\u6587\u732e\u53ef<\/span><strong style=\"margin: 0px;padding: 0px;max-width: 100%\"><span>\u4e0a\u4e0b\u6ed1\u52a8<\/span><\/strong><span>\u67e5\u770b<\/span><\/p>\n<\/section>\n<\/section>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px\" data-mpa-action-id=\"mel6pxjn1mmr\"><span><br \/><\/span><\/p>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px\" data-mpa-action-id=\"mel6pxjn235z\"><span><br \/><\/span><\/p>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px\" data-mpa-action-id=\"mel6pxjn235z\"><span style=\"font-size: 15px\" data-mpa-action-id=\"mel7ybph16u5\" data-pm-slice=\"0 0 []\"><span style=\"font-weight: bold\">\u4f5c\u8005\u7b80\u4ecb<\/span><\/span><\/p>\n<section style=\"text-align: center;margin-left: 8px;margin-right: 8px\"><img class=\"rich_pages wxw-img js_insertlocalimg\" data-imgfileid=\"100235400\" data-ratio=\"0.5625\" data-s=\"300,640\" data-type=\"jpeg\" data-w=\"800\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-63b92c29b4c3ade63d7d5d2e6eb3def9.jpeg\"><\/section>\n<section 
style=\"text-align: center;margin-left: 8px;margin-right: 8px\"><img class=\"rich_pages wxw-img js_insertlocalimg\" data-ratio=\"0.562962962962963\" data-s=\"300,640\" data-type=\"jpeg\" data-w=\"1080\" data-imgfileid=\"100235401\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-841bca4e122f8aea1ddd72ca6c943d3f.jpeg\" \/><\/section>\n<section data-mpa-action-id=\"mel6pxjn1oio\"><span><br \/><\/span><\/section>\n<blockquote>\n<p><span>\u672c\u8bcd\u6761\u7531\u96c6\u667a\u4ff1\u4e50\u90e8\u4f17\u5305\u751f\u4ea7\uff0c\u96be\u514d\u5b58\u5728\u7eb0\u6f0f\u548c\u95ee\u9898\uff0c\u6b22\u8fce\u5927\u5bb6\u7559\u8a00\u53cd\u9988\uff0c\u4e00\u7ecf\u91c7\u7eb3\uff0c\u53ef\u4ee5\u83b7\u5f97\u5bf9\u5e94\u7684\u79ef\u5206\u5956\u52b1\u5662\uff01<\/span><\/p>\n<\/blockquote>\n<section style=\"margin-bottom: 0px\" data-mpa-action-id=\"mel6pxjnpml\"><span style=\", Arial, sans-serif;font-size: 15px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;float: none\" data-pm-slice=\"0 0 []\"><span><br \/><\/span><\/span><\/section>\n<section style=\"margin: 0px;padding: 0px;max-width: 100%;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none\" data-pm-slice=\"0 0 []\" data-mpa-action-id=\"mel6pxjnjck\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><br \/><\/span><\/section>\n<section style=\"margin: 10px 0px 0px;padding: 0px;max-width: 100%;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-indent: 0px;text-transform: none;, Arial, sans-serif;font-size: 14px;text-align: center;justify-content: center\" data-mpa-action-id=\"mel6pxjnxf9\">\n<section style=\"margin: 0px;padding: 0px;max-width: 100%;width: auto;vertical-align: top;min-width: 10%;height: auto\">\n<section style=\"margin: 0px 0px -15px;padding: 0px;max-width: 100%\">\n<section style=\"margin: 0px;padding: 0px 10px;max-width: 
100%;font-size: 16px;line-height: 2;letter-spacing: 3px\">\n<p style=\"margin: 0px;padding: 0px;max-width: 100%;clear: both;min-height: 1em\"><strong style=\"margin: 0px;padding: 0px;max-width: 100%\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\">\u52a0\u5165\u6211\u4eec<\/span><\/strong><\/p>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<section style=\"margin: 0px 8px;padding: 0px;max-width: 100%;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;, Arial, sans-serif;font-size: 14px;clear: both;min-height: 1em;line-height: 2em\" data-mpa-action-id=\"mel6pxjn88o\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><br \/><\/span><\/section>\n<p data-pm-slice=\"0 0 []\" data-mpa-action-id=\"mel6pxjnin6\" style=\"margin: 0px 8px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\"><strong style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><span>\u4eb2\u7231\u7684\u793e\u533a\u4f19\u4f34\u4e0e\u77e5\u8bc6\u63a2\u7d22\u8005\uff1a<\/span><\/span><\/strong><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1q73\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\u6211\u4eec\u8bda\u631a\u9080\u8bf7\u70ed\u7231\u77e5\u8bc6\u5206\u4eab\u7684\u60a8\uff0c\u52a0\u5165<\/span><\/span><strong style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span style=\"margin: 0px;padding: 0px;max-width: 
100%\"><span>\u96c6\u667a\u767e\u79d1\u8bcd\u6761\u7f16\u5199\u5fd7\u613f\u56e2\u961f<\/span><\/span><\/strong><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\uff01\u65e0\u8bba\u60a8\u662f\u9886\u57df\u4e13\u5bb6\uff0c\u8fd8\u662f\u5bf9\u7279\u5b9a\u4e3b\u9898\u5145\u6ee1\u70ed\u5ff1\u7684\u5b66\u4e60\u8005\uff0c\u8fd9\u91cc\u90fd\u6709\u60a8\u7684\u821e\u53f0\u3002\u901a\u8fc7\u7f16\u5199\u767e\u79d1\u8bcd\u6761\uff0c\u60a8\u5c06\u4e3a\u5168\u7403\u8bfb\u8005\u4f20\u9012\u6743\u5a01\u77e5\u8bc6\uff0c\u540c\u65f6\u83b7\u5f97<\/span><\/span><strong style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><span>\u4e13\u5bb6\u6307\u5bfc<\/span><\/span><\/strong><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\u4e0e<\/span><\/span><strong style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><span>\u4e2a\u4eba\u80fd\u529b<\/span><\/span><\/strong><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\u8dc3\u5347\u7684\u53cc\u91cd\u6210\u957f\u3002<\/span><\/span><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1hr1\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><br \/><\/span><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1qpb\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 
15px\"><span>\ud83d\udcdd&nbsp;<\/span><\/span><strong style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><span>\u5fd7\u613f\u8005\u804c\u8d23<\/span><\/span><\/strong><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnfva\"><strong style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><span>\u521b\u4f5c\u65b0\u8bcd\u6761\uff1a<\/span><\/span><\/strong><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\u8986\u76d6\u590d\u6742\u7cfb\u7edf\u3001\u4eba\u5de5\u667a\u80fd\u7b49\u524d\u6cbf\u9886\u57df<\/span><\/span><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn2vi\"><strong style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><span>\u8fed\u4ee3\u7ecf\u5178\u5185\u5bb9<\/span><\/span><\/strong><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\uff1a\u66f4\u65b0\u73b0\u6709\u8bcd\u6761\uff0c\u5b88\u62a4\u77e5\u8bc6\u7684\u51c6\u786e\u6027\u4e0e\u65f6\u6548\u6027<\/span><\/span><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn9z\"><strong style=\"margin: 0px;padding: 
0px;max-width: 100%;font-size: 15px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><span>\u8d28\u91cf\u5b88\u62a4\u8005<\/span><\/span><\/strong><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\uff1a\u53c2\u4e0e\u5185\u5bb9\u6821\u5bf9\u5ba1\u6838\uff0c\u5171\u5efa\u7cbe\u54c1\u77e5\u8bc6\u5e93<\/span><\/span><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1sxm\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><br \/><\/span><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn450\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\ud83c\udf1f&nbsp;<\/span><\/span><strong style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><span>\u6211\u4eec\u671f\u5f85\u60a8<\/span><\/span><\/strong><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1pzs\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span style=\"font-weight: bold\">\u96c6\u667a\u8bfb\u4e66\u4f1a\u6210\u5458\uff08\u9700\u5b8c\u6210\u5171\u521b\u4efb\u52a1\u5e76\u83b7\u5f97\u9000\u8d39\u8d44\u683c\uff09<\/span><\/span><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: 
both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn7ew\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\u62e5\u6709\u6e05\u6670\u8868\u8fbe\u590d\u6742\u6982\u5ff5\u7684\u5199\u4f5c\u80fd\u529b<\/span><\/span><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn97l\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\u5bf9\u7279\u5b9a\u9886\u57df\u6709\u6df1\u5ea6\u7814\u7a76\u6216\u5f3a\u70c8\u5174\u8da3<\/span><\/span><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnxd0\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\u5177\u5907\u4fe1\u606f\u68c0\u7d22\u4e0e\u6574\u5408\u7d20\u517b<\/span><\/span><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnqmy\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\u6000\u63e3\u8d23\u4efb\u611f\u4e0e\u534f\u4f5c\u7cbe\u795e\uff0c\u613f\u4e3a\u77e5\u8bc6\u5171\u4eab\u8d4b\u80fd<\/span><\/span><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 
17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnirr\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><br \/><\/span><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1zcv\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\ud83c\udf81&nbsp;<\/span><\/span><strong style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><span>\u60a8\u5c06\u6536\u83b7<\/span><\/span><\/strong><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjnp3y\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\u767e\u79d1\u79ef\u5206\uff08\u652f\u6301\u5151\u6362\u96c6\u667a\u4ff1\u4e50\u90e8\u5468\u8fb9\uff1a\u6587\u5316\u886b\u3001\u590d\u6742\u79d1\u5b66\u77e5\u8bc6\u5361\u7b49\uff09<\/span><\/span><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn1dwx\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\u96c6\u667a\u4ff1\u4e50\u90e8\u521b\u59cb\u4eba\u5f20\u6c5f\u6559\u6388\u4eb2\u81ea\u6307\u5bfc\u5199\u4f5c<\/span><\/span><\/p>\n<p style=\"margin: 0px 8px;padding: 
0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;line-height: 1.75em\" data-mpa-action-id=\"mel6pxjn16ub\"><span style=\"margin: 0px;padding: 0px;max-width: 100%;font-size: 15px\"><span>\u79d1\u7814\u52a9\u7406\u664b\u5347\u901a\u9053\uff1a\u8868\u73b0\u4f18\u5f02\u8005\u53ef\u52a0\u5165\u5f20\u6c5f\u6559\u6388\u79d1\u7814\u56e2\u961f<\/span><\/span><\/p>\n<section style=\"margin: 0px 8px 24px;padding: 0px;max-width: 100%;, Arial, sans-serif;font-size: 17px;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-indent: 0px;text-transform: none;line-height: 1.75em;text-align: center\" data-mpa-action-id=\"mel6pxjn1ot\"><img alt=\"\u56fe\u7247\" class=\"rich_pages wxw-img\" data-ratio=\"0.42736842105263156\" data-type=\"png\" data-w=\"950\" style=\"margin: 0px;padding: 0px;max-width: 100%;vertical-align: bottom;height: auto !important;width: 661px !important;background-color: transparent\" data-width=\"950\" data-height=\"406\" data-imgfileid=\"100232724\" src=\"\" \/><\/section>\n<section style=\"text-align: center;margin-bottom: 0px\" data-mpa-action-id=\"mel6pxjn21ut\"><img class=\"rich_pages wxw-img js_insertlocalimg\" data-ratio=\"0.950920245398773\" data-s=\"300,640\" data-type=\"jpeg\" data-w=\"652\" style=\"width: 158px;height: 150px;background-color: transparent\" data-imgfileid=\"100233783\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-a09585cab4f8d6396030dec9b1e9078f-3.jpeg\" \/><\/section>\n<p data-mpa-action-id=\"mel6pxjn22px\" data-pm-slice=\"0 0 []\" style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;, Arial, sans-serif;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-indent: 0px;text-transform: none;line-height: 1.6em;font-size: 13px;text-align: 
center\"><span><span>\u52a0\u5165\u5f20\u6c5f\u7ec4\u53d1\u8d77\u7684\u4efb\u4f55\u4e00\u671f\u8bfb\u4e66\u4f1a\u5e76\u5b8c\u6210\u5171\u521b\u4efb\u52a1\u5373\u53ef \u8ba9\u6211\u4eec\u4e00\u8d77\uff0c\u7528\u77e5\u8bc6\u8fde\u63a5\u4e16\u754c\uff01<\/span><\/span><\/p>\n<section style=\"margin-bottom: 0px;letter-spacing: 0.544px;font-size: 14px;, Arial, sans-serif\" data-pm-slice=\"6 6 []\">\n<h1 style=\"margin-bottom: 5px;letter-spacing: 0.544px;font-size: 14px;, Arial, sans-serif\"><span style=\"font-size: 16px\"><strong><span style=\"font-size: 16px\"><span><br \/><\/span><\/span><\/strong><\/span><\/h1>\n<p><span style=\"font-size: 16px\"><strong><span style=\"font-size: 16px\"><span><br \/><\/span><\/span><\/strong><\/span><\/p>\n<section style=\"margin-top: 10px;margin-bottom: 0px;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px;text-align: center;justify-content: center\">\n<section style=\"width: auto;vertical-align: top;min-width: 10%;height: auto\">\n<section style=\"margin-bottom: -15px\">\n<section style=\"padding-right: 10px;padding-left: 10px;font-size: 16px;line-height: 2;letter-spacing: 3px\">\n<p><strong><span>\u81ea\u7531\u80fd\u539f\u7406\u4e0e\u5f3a\u5316\u5b66\u4e60\u8bfb\u4e66\u4f1a<\/span><\/strong><\/p>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px;line-height: 1.75em\"><span><br \/><\/span><\/p>\n<section style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px;line-height: 2em\"><span style=\"font-size: 15px;letter-spacing: 
0.544px\"><span>\u81ea\u7531\u80fd\u539f\u7406\u88ab\u8ba4\u4e3a\u662f\u201c\u81ea\u8fbe\u5c14\u6587\u81ea\u7136\u9009\u62e9\u7406\u8bba\u540e\u6700\u5305\u7f57\u4e07\u8c61\u7684\u601d\u60f3\u201d\uff0c\u5b83\u8bd5\u56fe\u4ece\u7269\u7406\u3001\u751f\u7269\u548c\u5fc3\u667a\u7684\u89d2\u5ea6\u63d0\u4f9b\u667a\u80fd\u4f53\u611f\u77e5\u548c\u884c\u52a8\u7684\u7edf\u4e00\u6027\u89c4\u5f8b\uff0c\u4ece\u7b2c\u4e00\u6027\u539f\u7406\u51fa\u53d1\u89e3\u91ca\u667a\u80fd\u4f53\u66f4\u65b0\u8ba4\u77e5\u3001\u63a2\u7d22\u548c\u6539\u53d8\u4e16\u754c\u7684\u673a\u5236\uff0c\u4ece\u800c\u5bf9\u4eba\u5de5\u667a\u80fd\uff0c\u7279\u522b\u662f\u5f3a\u5316\u5b66\u4e60\u4e16\u754c\u6a21\u578b\u3001\u901a\u7528\u4eba\u5de5\u667a\u80fd\u7814\u7a76\u5177\u6709\u91cd\u8981\u542f\u53d1\u610f\u4e49\u3002<\/span><\/span><\/section>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px;line-height: 2em\"><span><br \/><\/span><\/p>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px;line-height: 2em\"><span style=\"font-size: 15px\"><span>\u96c6\u667a\u4ff1\u4e50\u90e8\u8054\u5408\u5317\u4eac\u5e08\u8303\u5927\u5b66\u7cfb\u7edf\u79d1\u5b66\u5b66\u9662\u535a\u58eb\u751f\u725f\u7267\u4e91\uff0c\u5357\u4eac\u822a\u7a7a\u822a\u5929\u5927\u5b66\u526f\u6559\u6388\u4f55\u771f\uff0c\u4ee5\u53ca\u9aa5\u667a\u667a\u80fd\u79d1\u6280\u7b97\u6cd5\u5de5\u7a0b\u5e08\u3001\u516c\u4f17\u53f7 CreateAMind \u4e3b\u7f16\u5f20\u5fb7\u7965\uff0c\u5171\u540c\u53d1\u8d77\u300c<a class=\"normal_text_link\" target=\"_blank\" href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247684648&amp;idx=1&amp;sn=31d359ae9b22f282bca47889e403764e&amp;chksm=e89948a5dfeec1b3c61a686df6920c48a55dfe3d59dd974827877cf3d6b83922e42cd58dc591&amp;scene=21#wechat_redirect\" data-itemshowtype=\"0\" data-linktype=\"2\" rel=\"noopener 
noreferrer\">\u81ea\u7531\u80fd\u539f\u7406\u4e0e\u5f3a\u5316\u5b66\u4e60\u8bfb\u4e66\u4f1a<\/a>\u300d\uff0c\u5e0c\u671b\u63a2\u8ba8\u81ea\u7531\u80fd\u539f\u7406\u3001\u5f3a\u5316\u5b66\u4e60\u4e16\u754c\u6a21\u578b\uff0c\u4ee5\u53ca\u8111\u4e0e\u610f\u8bc6\u95ee\u9898\u4e2d\u7684\u9884\u6d4b\u52a0\u5de5\u7406\u8bba\u7b49\u524d\u6cbf\u4ea4\u53c9\u95ee\u9898\uff0c\u63a2\u7d22\u8fd9\u4e9b\u4e0d\u540c\u9886\u57df\u80cc\u540e\u8574\u542b\u7684\u611f\u77e5\u548c\u884c\u52a8\u7684\u7edf\u4e00\u539f\u7406\u3002<\/span><span style=\"font-size: 15px;letter-spacing: 0.544px;, Arial, sans-serif\"><span>\u8bfb\u4e66\u4f1a\u5df2\u5b8c\u7ed3\uff0c\u73b0\u5728\u62a5\u540d\u53ef\u52a0\u5165\u793e\u7fa4\u5e76\u89e3\u9501\u56de\u653e\u89c6\u9891\u6743\u9650\u3002<\/span><\/span><\/span><\/p>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px;line-height: 2em\"><span style=\"font-size: 15px\"><span><br \/><\/span><\/span><\/p>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px;line-height: 2em\"><span style=\"font-size: 15px\"><span class=\"js_jump_icon h5_image_link\"><span><img class=\"rich_pages wxw-img\" data-ratio=\"0.5714285714285714\" data-w=\"1050\" style=\"width: 100%;height: auto\" data-backw=\"562\" data-backh=\"321\" data-imgfileid=\"100203797\" src=\"\/wp-content\/uploads\/2025\/08\/wxsync-2025-08-296b5deefd0b2df9cabd83017a7b7d8c.png\" \/><\/span><\/span><\/span><\/p>\n<p><span><br \/><\/span><\/p>\n<section style=\"margin-right: 8px;margin-left: 8px;letter-spacing: 0.544px;, Arial, sans-serif;font-size: 14px;margin-bottom: 0px\"><span style=\", Arial, sans-serif;font-size: 15px;letter-spacing: 0.578px\"><span>\u8be6\u60c5\u8bf7\u89c1\uff1a<\/span><\/span><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;letter-spacing: 0.544px;, Arial, sans-serif;font-size: 14px\"><span style=\", Arial, 
sans-serif;font-size: 15px;letter-spacing: 0.578px;text-decoration: underline\"><span><a class=\"normal_text_link\" target=\"_blank\" href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247684648&amp;idx=1&amp;sn=31d359ae9b22f282bca47889e403764e&amp;chksm=e89948a5dfeec1b3c61a686df6920c48a55dfe3d59dd974827877cf3d6b83922e42cd58dc591&amp;scene=21#wechat_redirect\" data-itemshowtype=\"0\" data-linktype=\"2\" rel=\"noopener noreferrer\">\u81ea\u7531\u80fd\u539f\u7406\u4e0e\u5f3a\u5316\u5b66\u4e60\u8bfb\u4e66\u4f1a\u542f\u52a8\uff1a\u63a2\u7d22\u611f\u77e5\u548c\u884c\u52a8\u7684\u7edf\u4e00\u539f\u7406<\/a><\/span><\/span><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;letter-spacing: 0.544px;, Arial, sans-serif;font-size: 14px\"><span><br \/><\/span><\/section>\n<\/section>\n<p style=\"margin-right: 8px;margin-bottom: 5px;margin-left: 8px\" data-mpa-action-id=\"mel6pxjn1wbu\"><span><br \/><\/span><\/p>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;letter-spacing: 0.544px;, Arial, sans-serif;font-size: 14px\" data-mpa-action-id=\"mel6pxjntg1\"><strong style=\"letter-spacing: 0.544px\"><strong style=\"letter-spacing: 0.544px;font-size: 16px;text-align: center;, Arial, sans-serif\"><strong style=\"text-align: left;font-family: PingFangSC-light;letter-spacing: 0.544px\"><span style=\"font-size: 15px;letter-spacing: 0.544px\"><span>\u63a8\u8350\u9605\u8bfb<\/span><\/span><\/strong><\/strong><\/strong><\/p>\n<section style=\"margin-right: 8px;margin-bottom: 8px;margin-left: 8px;letter-spacing: 0.544px;, Arial, sans-serif;font-size: 14px\" data-mpa-action-id=\"mel6pxjn1z2z\"><strong><span>1.&nbsp;<a class=\"normal_text_link\" target=\"_blank\" href=\"https:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247718843&amp;idx=1&amp;sn=5ba4e603bdd9bb15de51abb092eb88b8&amp;scene=21#wechat_redirect\" data-itemshowtype=\"0\" data-linktype=\"2\" rel=\"noopener noreferrer\"><span style=\"text-decoration: 
underline\">\u57fa\u4e8e\u4e16\u754c\u6a21\u578b\u7684\u5f3a\u5316\u5b66\u4e60\u6846\u67b6: \u505a\u68a6\u8005\uff5c\u96c6\u667a\u767e\u79d1<\/span><\/a><\/span><\/strong><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 8px;margin-left: 8px;letter-spacing: 0.544px;, Arial, sans-serif;font-size: 14px\" data-mpa-action-id=\"mel6pxjn1v3o\"><strong style=\"letter-spacing: 0.544px\"><span>2.&nbsp;<a class=\"normal_text_link\" target=\"_blank\" href=\"https:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247667549&amp;idx=2&amp;sn=ee49b9613049a5dc2e152fdabcda1092&amp;scene=21#wechat_redirect\" data-itemshowtype=\"11\" data-linktype=\"2\" rel=\"noopener noreferrer\"><span style=\"text-decoration: underline\">\u5f3a\u5316\u5b66\u4e60\uff1a\u5173\u4e8e\u884c\u52a8\u7684\u667a\u80fd | \u4fde\u626c<\/span><\/a><\/span><\/strong><span style=\"text-decoration: underline\"><strong style=\"letter-spacing: 0.544px\"><span><br \/><\/span><\/strong><\/span><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 8px;margin-left: 8px;letter-spacing: 0.544px;, Arial, sans-serif;font-size: 14px\" data-mpa-action-id=\"mel6pxjn1xb0\"><strong style=\"letter-spacing: 0.544px\"><span>3.&nbsp;<a class=\"normal_text_link\" target=\"_blank\" href=\"https:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247485818&amp;idx=2&amp;sn=e1ee216064c0067b8dd4197fd84469d7&amp;scene=21#wechat_redirect\" data-itemshowtype=\"0\" data-linktype=\"2\" rel=\"noopener noreferrer\"><span style=\"text-decoration: underline\">AI\u6253\u6e38\u620f\u80cc\u540e\u7684\u6280\u672f\u539f\u7406 | \u5f20\u6c5f<\/span><\/a><\/span><\/strong><span style=\"text-decoration: underline\"><strong style=\"letter-spacing: 0.544px\"><span><br \/><\/span><\/strong><\/span><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 8px;margin-left: 8px;letter-spacing: 0.544px;, Arial, sans-serif;font-size: 14px\" data-pm-slice=\"4 5 []\" data-mpa-action-id=\"mel6pxjn244t\"><span><strong 
style=\"letter-spacing: 0.544px\"><span><span style=\"text-decoration: none\">4.&nbsp;<\/span><a class=\"normal_text_link\" target=\"_blank\" href=\"https:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247710871&amp;idx=1&amp;sn=f572fc0ff9abbc6b32185b835ed39122&amp;scene=21#wechat_redirect\" data-itemshowtype=\"0\" data-linktype=\"2\" rel=\"noopener noreferrer\"><span style=\"text-decoration: underline\">\u6d8c\u73b0\u52a8\u529b\u5b66\u5982\u4f55\u7528\u6765\u5206\u6790\u590d\u6742\u7cfb\u7edf\uff1f | \u65b0\u8bfe\u4e0a\u7ebf<\/span><\/a><\/span><\/strong><\/span><span style=\"margin: 0px;padding: 0px;max-width: 100%;text-decoration: underline\"><strong style=\"margin: 0px;padding: 0px;max-width: 100%;letter-spacing: 0.544px\"><strong style=\"margin: 0px;padding: 0px;max-width: 100%;letter-spacing: 0.544px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><br \/><\/span><\/strong><\/strong><\/span><\/section>\n<section style=\"margin: 0px 8px 8px;padding: 0px;max-width: 100%;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;, Arial, sans-serif;font-size: 14px\" data-mpa-action-id=\"mel6pxjn226z\"><strong style=\"margin: 0px;padding: 0px;max-width: 100%;letter-spacing: 0.544px\"><\/strong><strong style=\"margin: 0px;padding: 0px;max-width: 100%;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\">5.&nbsp;<\/span><\/strong><strong style=\"margin: 0px;padding: 0px;max-width: 100%;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><a class=\"normal_text_link\" target=\"_blank\" href=\"https:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247715376&amp;idx=2&amp;sn=e9b6f441a1a3615be72bb0b60594c015&amp;scene=21#wechat_redirect\" data-itemshowtype=\"11\" data-linktype=\"2\" rel=\"noopener noreferrer\"><span style=\"text-decoration: 
underline\">\u96c6\u667a\u5b66\u56ed\u7cbe\u54c1\u8bfe\u7a0b\u514d\u8d39\u5f00\u653e\uff0c\u89e3\u9501\u7cfb\u7edf\u79d1\u5b66\u4e0e AI \u65b0\u4e16\u754c<\/span><\/a><\/span><\/strong><\/section>\n<p style=\"margin: 0px 8px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;, Arial, sans-serif;font-size: 14px\" data-mpa-action-id=\"mel6pxjnvrn\"><strong style=\"margin: 0px;padding: 0px;max-width: 100%\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\">6.&nbsp;<a class=\"normal_text_link\" target=\"_blank\" href=\"https:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247716932&amp;idx=1&amp;sn=1fcb8a78a7f0157ad35a15d99f7ee9c1&amp;scene=21#wechat_redirect\" data-itemshowtype=\"0\" data-linktype=\"2\" rel=\"noopener noreferrer\"><span style=\"text-decoration: underline\">\u9ad8\u8003\u5206\u6570\u53ea\u662f\u5f20\u5165\u573a\u5238\uff0c\u4f60\u7684\u79d1\u7814\u5192\u9669\u5728\u8fd9\u91cc\u542f\u822a\uff01<\/span><\/a><\/span><\/strong><\/p>\n<p style=\"margin: 0px 8px;padding: 0px;max-width: 100%;clear: both;min-height: 1em;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;, Arial, sans-serif;font-size: 14px\" data-mpa-action-id=\"mel6pxjn43m\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><strong style=\"margin: 0px;padding: 0px;max-width: 100%\"><strong data-pm-slice=\"0 0 []\" style=\"margin: 0px;padding: 0px;max-width: 100%;, Arial, sans-serif;font-size: 14px;font-style: normal;text-align: justify;text-indent: 0px;text-transform: none;letter-spacing: 0.544px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><span style=\"text-decoration: none\">7.<\/span><\/span><\/strong><\/strong><\/span><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><strong style=\"margin: 0px;padding: 0px;max-width: 100%\"><strong data-pm-slice=\"0 0 
[]\" style=\"margin: 0px;padding: 0px;max-width: 100%;, Arial, sans-serif;font-size: 14px;font-style: normal;text-align: justify;text-indent: 0px;text-transform: none;letter-spacing: 0.544px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><span style=\"text-decoration: none\">&nbsp;<\/span><\/span><\/strong><\/strong><\/span><span style=\"margin: 0px;padding: 0px;max-width: 100%;text-decoration: underline\"><strong style=\"margin: 0px;padding: 0px;max-width: 100%\"><strong data-pm-slice=\"0 0 []\" style=\"margin: 0px;padding: 0px;max-width: 100%;, Arial, sans-serif;font-size: 14px;font-style: normal;text-align: justify;text-indent: 0px;text-transform: none;letter-spacing: 0.544px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><a class=\"normal_text_link\" target=\"_blank\" href=\"https:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247714367&amp;idx=1&amp;sn=a53ea91c122b2f82d5e0840d521d24a6&amp;scene=21#wechat_redirect\" data-itemshowtype=\"0\" data-linktype=\"2\" rel=\"noopener noreferrer\">\u7cfb\u7edf\u79d1\u5b66\u524d\u6cbf\u5341\u8bb2\uff1a\u7406\u89e3\u81ea\u7136\u3001\u751f\u547d\u4e0e\u793e\u4f1a\u7684\u590d\u6742\u6027<\/a><\/span><\/strong><\/strong><\/span><\/p>\n<section data-pm-slice=\"0 0 []\" style=\"margin: 0px 8px 8px;padding: 0px;max-width: 100%;font-style: normal;font-weight: 400;letter-spacing: 0.544px;text-align: justify;text-indent: 0px;text-transform: none;, Arial, sans-serif;font-size: 14px\" data-mpa-action-id=\"mel6pxjnk71\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><strong style=\"margin: 0px;padding: 0px;max-width: 100%;letter-spacing: 0.544px\"><span style=\"margin: 0px;padding: 0px;max-width: 100%\"><br \/><\/span><\/strong><\/span><\/section>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;letter-spacing: 0.544px;, Arial, sans-serif\" data-mpa-action-id=\"mel6pxjnmrc\"><span><br \/><\/span><\/p>\n<p style=\"margin-bottom: 0px;letter-spacing: 0.544px;font-size: 14px;, 
Arial, sans-serif\" data-mpa-action-id=\"mel6pxjnzpp\"><strong style=\"letter-spacing: 0.544px;font-size: 15px;text-align: left;font-family: PingFangSC-light\"><span><span>\u70b9\u51fb\u201c\u9605\u8bfb\u539f\u6587\u201d\uff0c<\/span><strong style=\"letter-spacing: 0.544px\"><span><strong style=\"letter-spacing: 0.544px\"><span>\u62a5\u540d\u8bfb\u4e66\u4f1a<\/span><\/strong><\/span><\/strong><\/span><\/strong><\/p>\n<\/p>\n<\/div>\n","protected":false},"excerpt":{"rendered":"<p>\u5bfc\u8bed \u6df1\u5ea6Q\u7f51\u7edc(Deep Q-Network, DQN)\u662f\u4e00\u79cd\u57fa\u4e8e\u6df1\u5ea6\u5b66\u4e60\u7684\u5f3a\u5316\u5b66\u4e60\u7b97\u6cd5\uff0c\u5b83\u901a\u8fc7\u6df1\u5ea6\u795e\u7ecf\u7f51\u7edc\u6765\u8fd1\u4f3c\u6700\u4f18\u52a8\u4f5c\u4ef7\u503c\u51fd\u6570\uff08Q\u51fd\u6570\uff09\uff0c\u80fd\u591f\u76f4\u63a5\u4ece\u9ad8\u7ef4\u611f\u77e5\u8f93\u5165\uff08\u5982\u6e38\u620f\u753b\u9762\u50cf\u7d20\uff09\u4e2d\u5b66\u4e60\u6700\u4f18\u51b3\u7b56\u7b56\u7565\u3002\u8be5\u7b97\u6cd5\u7684\u6838\u5fc3\u521b\u65b0\u5728\u4e8e\u7ed3\u5408\u4e86\u7ecf\u9a8c\u56de\u653e\u673a\u5236\u548c\u76ee\u6807\u7f51\u7edc\u6280\u672f\uff0c\u6709\u6548\u89e3\u51b3\u4e86\u4f20\u7edfQ\u5b66\u4e60\u5728\u975e\u7ebf\u6027\u51fd\u6570\u903c\u8fd1\u4e2d\u7684\u7a33&#8230;<\/p>\n","protected":false},"author":0,"featured_media":63790,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":[],"categories":[1],"tags":[],"special":[],"_links":{"self":[{"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/posts\/63835"}],"collection":[{"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/types\/post"}],"replies":[{"embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=63835"}],"version-history":[{"count":0,"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/posts\/63835\/revisions"}],"wp:featuredmedia":[{"embe
ddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/media\/63790"}],"wp:attachment":[{"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=63835"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=63835"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=63835"},{"taxonomy":"special","embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Fspecial&post=63835"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}