{"id":4739,"date":"2017-06-24T01:00:00","date_gmt":"2017-06-23T17:00:00","guid":{"rendered":"http:\/\/swarma.org\/%swarma-paper%\/"},"modified":"2018-12-06T00:33:45","modified_gmt":"2018-12-05T16:33:45","slug":"%e6%b5%85%e8%b0%88%e5%bc%ba%e5%8c%96%e5%ad%a6%e4%b9%a0-%e6%9c%b1%e7%91%9e%e9%b9%a4","status":"publish","type":"post","link":"https:\/\/swarma.org\/?p=4739","title":{"rendered":"\u6d45\u8c08\u5f3a\u5316\u5b66\u4e60 | \u6731\u745e\u9e64"},"content":{"rendered":"<div class=\"bpp-post-content\">\n<section class=\"xmteditor\" style=\"display:none;\"  ><\/section>\n<section  style=\"display: none; height: 0px;\"><\/section>\n<div class=\"post-image\"><img      src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma4-1534232142.jpg\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/div>\n<section  class=\"mpa-template\"  style=\"margin-left: 0.5em; margin-right: 0.5em;\">\n<section donone=\"shifuMouseDownCard(&#39;shifu_c_029&#39;)\" label=\"Copyright Reserved by PLAYHUDONG.\" style=\"margin: 1em 0px; padding: 0px; max-width: 100%; color: rgb(123, 12, 0); font-size: 16px; white-space: normal; line-height: 25.6px; border-width: 0px; border-style: none; background-color: rgb(255, 255, 255); border-color: rgb(123, 12, 0); box-sizing: border-box !important; word-wrap: break-word !important; overflow-wrap: break-word !important;\">\n<p style=\"margin: 10px 0px 0px 1em; padding: 0px; max-width: 100%; line-height: 1.4; border-color: rgb(123, 12, 0); box-sizing: border-box !important; word-wrap: break-word !important; overflow-wrap: break-word !important;\"><span style=\"margin: 0px; padding: 0px; max-width: 100%; font-size: 14px; border-color: rgb(123, 12, 0); color: rgb(255, 255, 255); box-sizing: border-box !important; word-wrap: break-word !important; overflow-wrap: break-word !important;\"><strong style=\"margin: 0px; padding: 0px; max-width: 100%; border-color: rgb(123, 12, 0); box-sizing: border-box !important; word-wrap: break-word !important; 
overflow-wrap: break-word !important;\"><span style=\"font-size: 14px; border-color: rgb(123, 12, 0); margin: 0px; padding: 0.2em 0.5em; max-width: 100%; font-weight: inherit; text-decoration: inherit; border-radius: 0.3em; text-align: center; background-color: rgb(123, 12, 0); box-sizing: border-box !important; word-wrap: break-word !important; overflow-wrap: break-word !important;\">\u5bfc\u8bed<\/span><\/strong><\/span><\/p>\n<section class=\"\" style=\"margin: -0.7em 0px 0px; padding: 0px; max-width: 100%; border-width: 1px; border-style: solid; border-color: rgb(123, 12, 0); border-radius: 0.4em; color: rgb(123, 12, 0); font-size: 1em; box-sizing: border-box !important; word-wrap: break-word !important; overflow-wrap: break-word !important;\">\n<section style=\"margin: 0px; padding: 1.4em 1em 1em; max-width: 100%; border-color: rgb(123, 12, 0); box-sizing: border-box !important; word-wrap: break-word !important; overflow-wrap: break-word !important;\">\n<section style=\"margin: 0px; padding: 0px; max-width: 100%; font-size: 1em; font-weight: inherit; text-align: inherit; text-decoration: inherit; border-color: rgb(123, 12, 0); box-sizing: border-box !important; word-wrap: break-word !important; overflow-wrap: break-word !important;\">\n<p style=\"max-width: 100%; clear: both; min-height: 1em; border-color: rgb(123, 12, 0); text-align: left; margin-top: 10px; box-sizing: border-box !important; word-wrap: break-word !important; overflow-wrap: break-word !important; letter-spacing: 0.5px;\"><span style=\"color: rgb(136, 136, 136); font-size: 13px; font-weight: inherit; text-decoration: inherit; text-align: inherit;\"><\/span><\/p>\n<p style=\"letter-spacing: 0.5px;\"><span style=\"font-weight: inherit; text-align: inherit; text-decoration: inherit; font-size: 13px; color: rgb(136, 136, 
136);\">\u524d\u4e9b\u65e5\u5b50AlphaGo\u4ee5\u4e00\u201c\u4eba\u201d\u4e4b\u529b\u6a2a\u626b\u4e86\u56fd\u5185\u51e0\u5927\u9876\u5c16\u56f4\u68cb\u9ad8\u624b\u7684\u4e8b\u60c5\uff0c\u76f8\u4fe1\u5728\u6c5f\u6e56\u4e0a\u5df2\u7ecf\u65e0\u4eba\u4e0d\u77e5\u65e0\u4eba\u4e0d\u6653\u4e86\u3002<\/span><\/p>\n<p style=\"margin-top: 10px; margin-bottom: 10px; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px; color: rgb(136, 136, 136);\">\u65b0\u95fb\u4e4b\u5916\uff0c\u5982\u679c\u4f60\u5bf9AlphaGo\u7684\u5b9e\u73b0\u6280\u672f\u611f\u5174\u8da3\uff0c\u76f8\u4fe1\u4f60\u4e5f\u5df2\u7ecf\u542c\u8bf4\u8fc7\u201c\u5f3a\u5316\u5b66\u4e60\u201d\u4e86\u3002<\/span><\/p>\n<p style=\"margin-top: 10px; margin-bottom: 10px; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px; color: rgb(136, 136, 136);\">AlphaGo\u662f\u4e2a\u5927\u5de5\u7a0b\uff0c\u9664\u4e86\u201c\u5f3a\u5316\u5b66\u4e60\u201d\uff0c\u8fd8\u5229\u7528\u4e86\u201c\u8499\u7279\u5361\u6d1b\u6811\u641c\u7d22\u201d\u7b49\u591a\u79cd\u6280\u672f\uff0c\u4eca\u5929\u6211\u4eec\u4e0d\u53bb\u8bb2\u8fd9\u4e9b\u590d\u6742\u7684\u6280\u672f\uff0c\u5c31\u5355\u5355\u8bb2\u4e0b\uff0c\u5565\u662f\u5f3a\u5316\u5b66\u4e60\uff1f<\/span><\/p>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<p><br  \/><\/p>\n<section  class=\"mpa-template\"  style=\"margin-left: 0.5em; margin-right: 0.5em;\">\n<section style=\"margin-top: 20px;display: -webkit-box;display: flex;-webkit-box-pack: center;justify-content: center;-webkit-box-align: center;align-items: center;\" >\n<section style=\"width: 35px;height: 35px;\" >\n<section style=\"width: 100%; height: 100%; display: flex; -webkit-box-pack: center; justify-content: center; -webkit-box-align: center; align-items: center; border-radius: 50%; border-width: 1px; border-style: solid; border-color: rgb(105, 13, 3);\" >\n<section style=\"background-color: rgb(105, 13, 3); padding: 5px; color: rgb(255, 255, 255); width: 80%; height: 80%; 
border-radius: 50%; font-size: 14px; line-height: 20px; text-align: center;\" >1<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<p style=\"margin-top: 10px; line-height: 2em; margin-left: 0.5em; margin-right: 0.5em; text-align: center;\"><strong><span style=\"color: rgb(123, 12, 0);\">\u4ec0\u4e48\u662f\u5f3a\u5316\u5b66\u4e60\uff1f<\/span><\/strong><\/p>\n<p style=\"margin-top: 10px; margin-bottom: 10px; line-height: 2em;\"><br  \/><\/p>\n<section   style=\"letter-spacing: 0.5px; display: inline !important; margin-left: 0.5em; margin-right: 0.5em;\">\n<section style=\"letter-spacing: 0.5px; display: inline !important;\">\n<section   style=\"display: inline !important;\">\n<section style=\"display: inline !important;\">\n<section style=\"display: inline !important; margin-left: 0.5em; margin-right: 0.5em; letter-spacing: 0.5px;\"><span style=\"font-size: 14px;\"><strong><span style=\"color: rgb(123, 12, 0); font-size: 14px;\">1\u3001\u5f3a\u5316\u5b66\u4e60\u7684\u6982\u5ff5<\/span><\/strong><\/span><\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u5f3a\u5316\u5b66\u4e60\u662f\u4e00\u79cd\u901a\u8fc7\u4e3b\u4f53\uff08Agent\uff09\u4e0e\u73af\u5883\uff08Environment\uff09\u4ea4\u4e92\u800c\u8fdb\u884c\u5b66\u4e60\u7684\u65b9\u6cd5\u3002\u5b83\u65e2\u4e0d\u5c5e\u4e8e\u6709\u76d1\u7763\u5b66\u4e60\uff0c\u4e5f\u4e0d\u5c5e\u4e8e\u65e0\u76d1\u7763\u5b66\u4e60\u3002\u5b83\u7684\u76ee\u6807\u662f\u8981\u901a\u8fc7\u4e0e\u73af\u5883\uff08Environment\uff09\u4ea4\u4e92\uff0c\u6839\u636e\u73af\u5883\u7684\u53cd\u9988\uff08Reward\uff09\uff0c\u4f18\u5316\u81ea\u5df1\u7684\u7b56\u7565\uff08Policy\uff09\uff0c\u518d\u6839\u636e\u7b56\u7565\u884c\u52a8\uff08Action\uff09\uff0c\u4ee5\u83b7\u5f97\u66f4\u591a\u66f4\u597d\u7684\u53cd\u9988\u5956\u52b1\uff08Reward\uff09\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; 
white-space: normal; text-align: center; letter-spacing: 0.5px; line-height: 2em;\"><inherit><img     style=\"border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: 540px;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma0-1534232142.png\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u8fd9\u662f\u4e00\u4e2a\u884c\u52a8&amp;\u53cd\u9988\u73af\uff0c\u7b80\u5355\u7684\u6765\u8bb2\u5c31\u662f\u5f3a\u5316\u5b66\u4e60\u7684\u4e3b\u4f53\u53ef\u4ee5\u901a\u8fc7\u73af\u5883\u7684\u53cd\u9988\uff0c\u5c06\u81ea\u5df1\u5b8c\u6210\u4efb\u52a1\u7684\u65b9\u5f0f\u4f18\u5316\u7684\u8d8a\u6765\u8d8a\u597d\uff0c\u4e0b\u9762\u7684\u52a8\u56fe\u5c31\u5f88\u597d\u7684\u8bf4\u660e\u4e86\u8fd9\u4e2a\u60c5\u51b5\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><inherit><img     style=\"border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: 540px;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma2-1534232142.gif\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 14px;\"><strong><span style=\"color: rgb(123, 12, 0);\">2\u3001\u9664\u4e86\u4e0b\u68cb\uff0c\u5f3a\u5316\u5b66\u4e60\u8fd8\u80fd\u5e72\u70b9\u5565\uff1f<\/span><\/strong><\/span><\/p>\n<p style=\"margin: 10px 0.5em; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\">\u9664\u4e86\u4e0b\u68cb\uff0c\u5f3a\u5316\u5b66\u4e60\u5728\u5176\u5b83\u65b9\u9762\u7684\u5e94\u7528\u4e5f\u662f\u975e\u5e38\u7684\u706b\u70ed\uff0c\u6bd4\u5982\uff0c\u81ea\u52a8\u9a7e\u9a76\uff0c\u518d\u4e5f\u4e0d\u9700\u8981\u8001\u53f8\u673a\u5566\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: 
normal; text-align: center; letter-spacing: 0.5px; line-height: 2em;\"><inherit><img     style=\"border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: auto;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma3-1534232143.gif\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u518d\u6bd4\u5982\uff0c\u673a\u5668\u4eba\u673a\u68b0\u81c2\u7684\u63a7\u5236\u5b66\u4e60\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; text-align: center; letter-spacing: 0.5px; line-height: 2em;\"><inherit><img     style=\"border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: auto;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma9-1534232143.gif\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u751a\u81f3\uff0c\u63a7\u5236\u822a\u5929\u5668\u7684\u7740\u9646\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; text-align: center; letter-spacing: 0.5px; line-height: 2em;\"><inherit><img     style=\"border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: auto;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma8-1534232143.gif\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; text-align: left; letter-spacing: 0.5px; line-height: 2em;\"><inherit><span style=\"color: rgb(123, 12, 0);\"><strong><span style=\"color: rgb(123, 12, 0); font-size: 14px;\">3\u3001\u5f3a\u5316\u5b66\u4e60\u7684\u72ec\u7279\u4e4b\u5904<\/span><\/strong><\/span><\/inherit><\/p>\n<p style=\"margin-left: 0.5em; margin-right: 0.5em;\"><span style=\"font-size: 
13px;\">\u5f3a\u5316\u5b66\u4e60\u65e2\u4e0d\u5c5e\u4e8e\u6709\u76d1\u7763\u5b66\u4e60\uff0c\u4e5f\u4e0d\u5c5e\u4e8e\u65e0\u76d1\u7763\u5b66\u4e60\uff0c\u8fd9\u662f\u4e3a\u4ec0\u4e48\u54ea\uff1f<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; text-align: center; letter-spacing: 0.5px; line-height: 2em;\"><inherit><img     style=\"border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: auto;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma7-1534232143.jpeg\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u7b3c\u7edf\u7684\u8bb2\uff0c\u5f3a\u5316\u5b66\u4e60\u548c\u76d1\u7763\u5b66\u4e60\u8fd8\u662f\u6709\u4e00\u4e9b\u5171\u540c\u70b9\u7684\uff0c\u6bd4\u5982\u4e24\u8005\u90fd\u662f\u6839\u636e\u8f93\u5165\u505a\u51fa\u51b3\u7b56\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 
13px;\">\u4f46\u662f\u4e24\u8005\u7684\u5dee\u522b\u4e5f\u5f88\u5927\u3002\u6bd4\u5982\u5728\u76d1\u7763\u5b66\u4e60\u4e2d\uff0c\u4e00\u822c\u4e00\u6b21\u8f93\u5165\u5bf9\u5e94\u4e00\u6b21\u8f93\u51fa\uff0c\u5373\u8f93\u5165\u548c\u8f93\u51fa\u5728\u65f6\u95f4\u5e8f\u5217\u4e0a\u662f\u5bf9\u5e94\u7684\u3002\u800c\u5f3a\u5316\u5b66\u4e60\u4e2d\uff0c\u4e00\u822c\u662f\u4ee5\u4e00\u4e2a\u5e8f\u5217\u5316\u7684\u6570\u636e\u4f5c\u4e3a\u8f93\u5165\uff0c\u9700\u8981\u4e0d\u505c\u7684\u4f5c\u51fa\u51b3\u7b56\u3002\u5e76\u4e14\u5728\u91c7\u53d6\u4e00\u4e2a\u52a8\u4f5c\u540e\uff0c\u5e76\u4e0d\u80fd\u7acb\u523b\u5f97\u5230\u73af\u5883\u7684\u53cd\u9988\u3002\u6bd4\u5982\u4e0b\u56f4\u68cb\u7684\u65f6\u5019\u572817\u6b65\u8d70\u4e86\u4e00\u5b50\uff0c\u5bfc\u81f4\u572833\u6b65\u7684\u65f6\u5019\u8f93\u6389\u4e86\u6574\u76d8\u68cb\u3002\u73af\u5883\u5e76\u4e0d\u80fd\u572817\u6b65\u7684\u65f6\u5019\u5c31\u544a\u8bc9\u4f60\u8d70\u7684\u4e0d\u597d\uff0c\u53ea\u80fd\u5728\u8f93\u6389\u6574\u76d8\u68cb\u540e\uff0c\u518d\u53bb\u601d\u8003\u54ea\u4e00\u6b65\u8d70\u7684\u4e0d\u597d\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u6240\u4ee5\u5f3a\u5316\u5b66\u4e60\u8981\u601d\u8003\u600e\u6837\u624d\u80fd\u8fbe\u5230\u4e00\u4e2a\u957f\u671f\u7684\u76ee\u6807\uff0c\u800c\u4e0d\u80fd\u53ea\u987e\u53ca\u773c\u524d\u7684\u5229\u76ca\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\"><\/span><\/p>\n<section  class=\"mpa-template\"  style=\"margin-left: 0.5em; margin-right: 0.5em;\">\n<section style=\"margin-top: 20px;display: -webkit-box;display: flex;-webkit-box-pack: center;justify-content: center;-webkit-box-align: center;align-items: center;\" >\n<section style=\"width: 35px;height: 35px;\" >\n<section style=\"width: 100%; height: 100%; display: flex; -webkit-box-pack: center; justify-content: 
center; -webkit-box-align: center; align-items: center; border-radius: 50%; border-width: 1px; border-style: solid; border-color: rgb(105, 13, 3);\" >\n<section style=\"background-color: rgb(105, 13, 3); padding: 5px; color: rgb(255, 255, 255); width: 80%; height: 80%; border-radius: 50%; font-size: 14px; line-height: 20px; text-align: center;\" >2<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px; text-align: center;\"><span style=\"color: rgb(123, 12, 0);\"><strong>\u5f3a\u5316\u5b66\u4e60\u7684\u6838\u5fc3<\/strong><\/span><\/p>\n<section   style=\"display: inline !important; margin-left: 0.5em; margin-right: 0.5em;\">\n<section style=\"display: inline !important;\">\n<section style=\"display: inline !important;\">\n<p style=\"margin-left: 0.5em; margin-right: 0.5em;\"><span style=\"font-size: 14px; color: rgb(123, 12, 0);\"><strong>1\u3001\u5efa\u6a21\u53ca\u6838\u5fc3\u6982\u5ff5<\/strong><\/span><\/p>\n<p style=\"margin: 10px 0.5em; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px; letter-spacing: 0.5px;\">\u8981\u6df1\u523b\u4e86\u89e3\u5f3a\u5316\u5b66\u4e60\uff0c\u6700\u597d\u5148\u719f\u6089\u5f3a\u5316\u5b66\u4e60\u5728\u6a21\u578b\u4e0a\u662f\u5982\u4f55\u5b9a\u4e49\u7684\uff0c\u4e0b\u9762\u6211\u4eec\u5c31\u8ba8\u8bba\u4e0b\u5f3a\u5316\u5b66\u4e60\u7684\u6a21\u578b\u5b9a\u4e49\u65b9\u6cd5\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px; letter-spacing: 0.5px;\">\u5f3a\u5316\u5b66\u4e60\u662f\u4ee5MDP\uff08Markov Decision 
Process)\u4f5c\u4e3a\u57fa\u7840\u6a21\u578b\u7684\u3002\u5373\u5047\u8bbe\u73af\u5883\u72b6\u6001\uff08state\uff09\u662f\u201cMarkov\u201d\u7684\uff0c\u8fd9\u8868\u793astate\u672a\u6765\u7684\u53d8\u5316\uff0c\u53ea\u4e0e\u5f53\u524d\u7684\u72b6\u6001\u6709\u5173\uff0c\u8ddf\u8fc7\u53bb\u7684\u72b6\u6001\u6ca1\u6709\u4efb\u4f55\u5173\u7cfb\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px; letter-spacing: 0.5px;\">\u4e3e\u4e2a\u4f8b\u5b50\uff0c\u5f53\u6211\u4eec\u53bb\u89c2\u5bdf\u522b\u4eba\u4e0b\u68cb\u7684\u65f6\u5019\uff0c\u6211\u4eec\u8fc7\u53bb\u4e00\u770b\u5c31\u80fd\u77e5\u9053\u5f53\u524d\u7684\u68cb\u5c40\u72b6\u6001\u662f\u600e\u4e48\u6837\u7684\uff0c\u751a\u81f3\u8fd8\u53ef\u4ee5\u4e03\u5634\u516b\u820c\u7684\u6307\u5bfc\u68cb\u624b\u600e\u4e48\u8d70\uff0c\u8fd9\u5e76\u4e0d\u9700\u8981\u77e5\u9053\u4ed6\u4eec\u4e4b\u524d\u4e0b\u68cb\u7684\u6b65\u9aa4\u3002<\/span><img     style=\"letter-spacing: 0.5px; border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: 540px;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma2-1534232144.png\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><span style=\"font-size: 13px;\">\u6240\u4ee5\uff0c\u4e3b\u4f53\u6240\u505a\u7684\u7b56\u7565\uff08Policy)\u5c31\u53ef\u4ee5\u8868\u793a\u6210\uff1a<\/span><img     style=\"height: 77px; border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: 416px;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma8-1534232144.png\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/p>\n<p style=\"margin: 10px 0.5em; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 
13px;\">\u5373\u8868\u793a\u5f53\u524d\u7684\u72b6\u6001St\uff0c\u52a8\u4f5cAt\uff0c\u5df2\u7ecf\u5305\u542b\u4e86\u8fc7\u53bb\u6240\u6709\u6709\u7528\u7684\u4fe1\u606f\uff08S0,A0,R1\u2026\u2026\uff09\u3002\u6709\u4e86\u4e0a\u9762\u7684\u5047\u8bbe\uff0c\u673a\u5668\u6240\u505a\u7684\u51b3\u7b56\uff08\u03c0\uff0cPolicy\uff0c\u8868\u793a\u4e0b\u4e00\u6b65\u884c\u52a8\u7684\u7b56\u7565\uff09\uff0c\u53ef\u4ee5\u8868\u793a\u6210\u53ea\u4e0e\u5f53\u524d\u72b6\u6001\u6709\u5173\u7684\u51fd\u6570\u3002<\/span><img     style=\"text-align: center; height: 106px; border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: 452px;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma9-1534232144.png\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/p>\n<p style=\"margin: 10px 0.5em; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\">\u90a3\u4e48\u600e\u4e48\u624d\u80fd\u8ba9\u7b56\u7565\u8fbe\u5230\u6700\u4f18\u54ea\uff1f<\/span><\/p>\n<p style=\"margin: 10px 0.5em; line-height: 2em; letter-spacing: 0.5px;\"><strong style=\"color: rgb(123, 12, 0);\"><span style=\"font-size: 14px;\">2\u3001\u4f18\u5316\u7b56\u7565\uff08policy\uff09\u7684\u76ee\u6807<\/span><\/strong><\/p>\n<p style=\"margin: 10px 0.5em; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\">\u8981\u6c42\u51fa\u6700\u4f18\u7684\u7b56\u7565\uff0c\u6211\u4eec\u8fd8\u9700\u8981\u8fdb\u884c\u4e00\u4e2a\u5047\u8bbe\u3002<\/span><\/p>\n<\/section>\n<\/section>\n<\/section>\n<p style=\"margin: 10px 0.5em; white-space: normal; text-align: center; letter-spacing: 0.5px; line-height: 2em;\"><inherit><img     style=\"height: 150px; border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: 263px;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma8-1534232144.jpeg\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; 
letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u8fd9\u4e2a\u5047\u8bbe\u5c31\u662f\uff1a\u6211\u4eec\u4f18\u5316policy\u9700\u8981\u8fbe\u5230\u7684\u6240\u6709\u76ee\u6807\u5168\u90e8\u5305\u542b\u5728\u73af\u5883\u7ed9\u4e88\u7684\u5956\u52b1\uff08reward\uff09\u4e2d\u3002\u6240\u4ee5\u8981\u6c42\u6700\u4f18\u5316\u7684\u7b56\u7565\uff0c\u5c31\u9700\u8981\u5c3d\u53ef\u80fd\u7684\u83b7\u53d6\u66f4\u591areward\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; text-align: center; letter-spacing: 0.5px; line-height: 2em;\"><inherit><img     style=\"height: 68px; border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: 407px;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma7-1534232144.png\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u90a3\u4e48\u6211\u4eec\u5c31\u5b9a\u4e49\u4e00\u4e2a\u5f0f\u5b50\uff0c\u628a\u5f3a\u5316\u5b66\u4e60\u5728\u4e00\u8f6e\u5b66\u4e60\u8fc7\u7a0b\u4e2d\u80fd\u83b7\u53d6\u7684reward\u90fd\u52a0\u8d77\u6765\u3002\u5728\u76f8\u52a0\u65f6\u9700\u8981\u7ed9\u4e0d\u540c\u65f6\u523b\u7684reward\u4e58\u4ee5\u4e00\u4e2a\u4e0d\u540c\u7684\u7cfb\u6570\u3002\u4e3a\u4ec0\u4e48\u8981\u4e58\u4ee5\u4e00\u4e2a\u6743\u503c\uff1f\u56e0\u4e3a\u4e0d\u540c\u65f6\u95f4\u6bb5\u7684reward\u5bf9\u76ee\u6807\u7684\u5f71\u54cd\u7a0b\u5ea6\u4e0d\u540c\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u628a\u6240\u6709reward\u52a0\u8d77\u6765\u7684\u503c\u53eb\u505aReturn\uff0c\u4ee3\u8868\u5f3a\u5316\u5b66\u4e60\u5728\u672a\u6765\u80fd\u62ff\u5230\u7684\u6240\u6709\u6536\u76ca\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 
13px;\">\u6211\u4eec\u5bf9Return\u53d6\u4e00\u4e2a\u671f\u671b\uff0c\u5c31\u83b7\u5f97\u4e86Value\u51fd\u6570\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; text-align: center; letter-spacing: 0.5px; line-height: 2em;\"><inherit><img     style=\"height: 60px; border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: 421px;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma2-1534232144-1.png\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u5728\u8fd9\u4e2a\u51fd\u6570\u4e2d\uff0cs\u4ee3\u8868\u73af\u5883\u72b6\u6001\uff08state\uff09\uff0c\u03c0\u662f\u7b56\u7565\uff08policy\uff09\uff0cv\u662fstate\u7684value\uff0c\u4ee3\u8868\u5728\u8fd9\u4e2astate\u4e0b\uff0c\u91c7\u53d6\u8fd9\u4e2a\u7b56\u7565\uff0c\u6211\u4eec\u672a\u6765\u80fd\u62ff\u5230\u591a\u5c11\u56de\u62a5\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u7406\u60f3\u72b6\u6001\u4e0b\uff0cValue\u51fd\u6570\u662f\u53ea\u4e0e\u5f53\u524d\u73af\u5883\u72b6\u6001\uff08state\uff09\u6709\u5173\u7684\u51fd\u6570\u3002\u56e0\u4e3a\u5f53\u524d\u7684\u73af\u5883\u72b6\u6001\uff08state\uff09\u51b3\u5b9a\u4e86\u7cfb\u7edf\u672a\u6765\u7684\u8d70\u5411\uff0c\u4e5f\u5c31\u51b3\u5b9a\u4e86\u672a\u6765\u7684\u73af\u5883\u72b6\u6001\uff08state\uff09\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 
13px;\">\u5b9e\u9645\u5e94\u7528\u4e2d\uff0c\u9700\u8981\u5f53\u524dstate\u548c\u7b56\u7565\uff08policy\uff09\u4e00\u8d77\u624d\u80fd\u51b3\u5b9a\u672a\u6765\u7684state\u3002\u56e0\u4e3a\u6839\u636epolicy\u91c7\u53d6\u7684\u884c\u52a8\uff08action\uff09\u4f1a\u5f71\u54cd\u73af\u5883\u7684\u8d70\u5411\uff0c\u4e5f\u5c31\u662f\u5f71\u54cdstate\u7684\u53d8\u5316\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u6211\u4eec\u6709\u4e86Value\u51fd\u6570\u6765\u8ba1\u7b97\u5728\u5f53\u524d\u72b6\u6001\u4e0b\uff0c\u91c7\u53d6\u6bcf\u79cd\u7b56\u7565\uff08policy\uff09\u80fd\u83b7\u5f97\u7684\u6536\u76ca\uff0c\u90a3\u4e48\u6211\u4eec\u5c31\u53ef\u4ee5\u8ba1\u7b97\u6bcf\u4e2a\u884c\u52a8\uff08action\uff09\u80fd\u83b7\u5f97\u6536\u76ca\uff08\u7cfb\u7edf\u6839\u636e\u7b56\u7565\u91c7\u53d6\u884c\u52a8\uff09\u3002\u54ea\u4e00\u4e2aaction\u80fd\u83b7\u5f97\u7684\u6536\u76ca\uff08Value\uff09\u8d8a\u5927\uff0c\u6211\u4eec\u5c31\u91c7\u7528\u54ea\u4e2aaction\u3002\u6240\u4ee5\u7cfb\u7edf\u603b\u662f\u80fd\u9009\u62e9\u51fa\u6700\u4f18\u7684\u7b56\u7565\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u7136\u800c\u8fd9\u79cd\u65b9\u6cd5\u6709\u4e00\u4e2a\u95ee\u9898\uff0c\u6709\u65f6\u5019\u7cfb\u7edf\u5e76\u4e0d\u80fd\u76f4\u89c2\u7684\u83b7\u5f97\u6bcf\u4e2aaction\u6240\u5bf9\u5e94\u7684value\uff0c\u56e0\u4e3a\u73af\u5883\u5b58\u5728\u52a8\u6001\u6027\u3002\u6bd4\u5982\u5bf9\u4e00\u4e2a\u5728\u73b0\u5b9e\u73af\u5883\u91cc\u884c\u52a8\u7684\u673a\u5668\u4eba\u6765\u8bf4\uff0c\u5b83\u5728\u91c7\u53d6\u4e00\u4e2aaction\u7684\u65f6\u5019\uff0c\u6709\u65f6\u5019\u4f1a\u78b0\u5230\u5899\uff0c\u6709\u65f6\u5019\u8fd8\u6ca1\u884c\u52a8\u5c31\u5df2\u7ecf\u6454\u5012\u4e86\uff0c\u5f80\u5f80\u4e0d\u80fd\u987a\u5229\u7684\u83b7\u53d6action\u5bf9\u5e94\u7684value\u3002<\/span><\/p>\n<p 
style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u9488\u5bf9\u8fd9\u79cd\u95ee\u9898\uff0c\u6211\u4eec\u5b9a\u4e49\u4e00\u4e2a\u65b0\u7684Value function\uff0c\u53eb\u505aAction-Value function\u3002\u5b83\u4e0d\u4ec5\u662fstate\u7684\u51fd\u6570\uff0c\u4e5f\u662fAction\u7684\u51fd\u6570\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><inherit><img     style=\"height: 60px; border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: 458px;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma0-1534232144.png\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u6240\u4ee5\u6211\u4eec\u5c31\u4e0d\u9700\u8981\u9884\u6d4b\u4e0b\u4e00\u4e2astate\uff0c\u6211\u4eec\u53ea\u9700\u8981\u9488\u5bf9\u6211\u4eec\u5f53\u524d\u7684state\uff0c\u770b\u4e00\u4e0b\u54ea\u4e00\u4e2aaction\u53ef\u4ee5\u4f7fq\u03c0(s,a)\u6700\u5927\uff0c\u90a3\u6211\u4eec\u5c31\u53ef\u4ee5\u9009\u62e9\u8fd9\u4e2aaction\uff0c\u8fd9\u6837\u6211\u4eec\u5c31\u4e0d\u9700\u8981\u5bf9\u6574\u4e2a\u4e16\u754c\u7684\u52a8\u6001\u6027\u8fdb\u884c\u5efa\u6a21\uff0c\u6240\u4ee5\u8fd9\u79cd\u65b9\u5f0f\u53eb\u505a\u201cmodel-free\u201d\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><strong style=\"color: rgb(123, 12, 0); font-size: 14px;\">3\u3001on-policy &amp; off-policy<\/strong><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 
13px;\">\u5728\u6211\u4eec\u4e0a\u9762\u8bb2\u5230\u7684\u4e24\u4e2a\u4ef7\u503c\u51fd\u6570\u4e2d\uff0c\u90fd\u5305\u542b\u6709\u03c0\uff08\u5373policy\uff09\uff0c\u6240\u4ee5\u5b83\u4eec\u90fd\u662f\u8ddf\u7b56\u7565\u6709\u5173\u7684\u3002policy\u4f1a\u5f71\u54cd\u672a\u6765\u7684state\u4f1a\u600e\u4e48\u53d1\u5c55\uff0cvalue\u7684\u8ba1\u7b97\u9700\u8981policy\uff0c\u800cpolicy\u53c8\u662f\u6839\u636evalue\u6765\u91c7\u53d6\u7684\uff0c\u6240\u4ee5policy\u548cvalue\u662f\u4e92\u76f8\u5f71\u54cd\u7684\u3002\u6240\u4ee5\u6211\u4eec\u628a\u8fd9\u79cdvalue\u53d7policy\u7ea6\u675f\u7684\u5b66\u4e60\u65b9\u6cd5\uff0c\u53eb\u505a\u201con-policy\u201d\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u4e0e\u4e4b\u5bf9\u5e94\uff0c\u8fd8\u6709\u4e00\u79cd\u53eb\u505a\u201coff-policy\u201d\u7684\u5b66\u4e60\u65b9\u6cd5\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">on-policy\u4f30\u8ba1\u7684\u662f\u5f53\u524d\u7b56\u7565\u7684value\uff0c\u800coff-policy\u4f30\u8ba1\u7684\u662f\u6700\u4f18\u7b56\u7565\u7684value\u3002\u5373\u4e0d\u518d\u4f30\u8ba1\u81ea\u5df1\u5728\u5f53\u524d\u72b6\u6001\u4e0b\u80fd\u8fbe\u5230\u591a\u5c11\u56de\u62a5\uff0c\u800c\u662f\u4f30\u8ba1\u5728\u6700\u4f18\u7684\u60c5\u51b5\u4e0b\uff0c\u672a\u6765\u6700\u5927\u80fd\u62ff\u5230\u591a\u5c11\u56de\u62a5\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><inherit><img     style=\"height: 61px; border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: 471px;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma4-1534232144.png\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span 
style=\"font-size: 13px;\">\u4e3e\u4e2a\u4f8b\u5b50\uff1a\u5bf9\u5f85\u540c\u4e00\u76d8\u56f4\u68cb\uff0c\u6211\u6709\u6211\u7684value\uff0c\u67ef\u6d01\u6709\u67ef\u6d01\u7684value\uff0c\u67ef\u6d01\u7684value\u5f88\u5927\uff0c\u56e0\u4e3a\u4ed6\u4e0b\u56f4\u68cb\u5f88\u5389\u5bb3\uff0c\u800c\u6211\u7684value\u5f88\u5c0f\uff0c\u56e0\u4e3a\u6211\u4e0d\u4f1a\u4e0b\u56f4\u68cb\u3002\u5373\u5728off-policy\u7684\u60c5\u51b5\u4e0b\uff0c\u4f18\u5316\u7684\u5e76\u4e0d\u662f\u5f53\u524dpolicy\u7684value\u4e86\uff0c\u800c\u662f\u6240\u6709\u53ef\u80fdvalue\u7684\u6700\u5927\u503c\uff0c\u5373value\u7684\u4f18\u5316\u548c\u5f53\u524d\u7684policy\u6ca1\u6709\u5173\u7cfb\uff0c\u6240\u4ee5\u53eb\u201coff-policy\u201d\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u90a3\u8fd9\u4e2avalue\u7684\u6700\u5927\u503c\u8981\u600e\u6837\u8ba1\u7b97\uff1f<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><inherit><img     style=\"height: 125px; border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: 519px;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma0-1534232145.png\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 14px;\">\u8fd9\u5c31\u8981\u91c7\u7528\u4e0a\u9762\u7684\u8d1d\u5c14\u66fc\u65b9\u7a0b\uff0c\u628aq*(s,a)\u7684\u5b9a\u4e49\uff0c\u5199\u6210\u4e00\u4e2a\u8fed\u4ee3\u7684\u65b9\u5f0f\u3002\u8ba9\u5f53\u524dstate\u7684value\uff0c\u901a\u8fc7\u4e0b\u4e00\u4e2astate\u6765\u51b3\u5b9a\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><strong style=\"color: rgb(123, 12, 0); font-size: 14px;\">4\u3001\u4f30\u8ba1value\u7684\u65b9\u6cd5<\/strong><\/p>\n<p style=\"margin: 
10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u4e0a\u9762\u6211\u4eec\u8bf4\u8ba1\u7b97value\u5b9e\u9645\u4e0a\u662f\u4e0d\u51c6\u786e\u7684\uff0c\u56e0\u4e3a\u6211\u4eec\u65e0\u6cd5\u8ba1\u7b97\u51favalue\u7684\u7cbe\u786e\u503c\uff0c\u53ea\u80fd\u901a\u8fc7\u4f30\u8ba1\u3002\u4f30\u8ba1value\u7684\u7b97\u6cd5\u6709\u5f88\u591a\uff0c\u4e00\u822c\u5206\u4e3a\u4e0b\u9762\u4e09\u4e2a\u5927\u7c7b\u522b\uff0c\u4e0b\u9762\u6211\u4eec\u5c31\u6765\u76d8\u70b9\u4e00\u4e0b\u8fd9\u4e09\u79cd\u7c7b\u522b\u7684\u7b97\u6cd5\u5404\u6709\u4ec0\u4e48\u7279\u70b9\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><strong><span style=\"font-size: 13px;\">Monte Carlo\uff1a<\/span><\/strong><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u8fd9\u79cd\u7b97\u6cd5\u7684\u7279\u70b9\u662f\uff0c\u4e0d\u80fd\u5728\u6bcf\u4e00\u6b21state\u53d8\u5316\u540e\u5c31\u66f4\u65b0value\uff0c\u53ea\u80fd\u5728\u4e00\u6b21\u5b8c\u6574\u7684\u5b66\u4e60\u8fc7\u7a0b\uff08\u6bd4\u5982\u4e00\u76d8\u68cb\uff09\u7ed3\u675f\u540e\uff0c\u901a\u8fc7\u83b7\u53d6\u6700\u7ec8\u7684\u603b\u6536\u76ca\uff08Return\uff09\uff0c\u518d\u5bf9\u8fc7\u7a0b\u4e2d\u6bcf\u4e2astate\u7684value\u8fdb\u884c\u66f4\u65b0\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u5b83\u7684\u4f18\u70b9\u662f\u4e0d\u9700\u8981\u5bf9\u73af\u5883\u8fdb\u884c\u5efa\u6a21\uff0c\u5373\u201cModel-free\u201d\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><strong><span style=\"font-size: 13px;\">Dynamic Programming\uff1a<\/span><\/strong><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 
13px;\">\u8fd9\u79cd\u7b97\u6cd5\u9700\u8981\u5bf9\u73af\u5883\u5efa\u7acb\u4e00\u4e2a\u5b8c\u6574\u51c6\u786e\u7684\u6a21\u578b\uff0c\u8fd9\u6837\u4e00\u6765\u7cfb\u7edf\u7684\u72b6\u6001\u53d8\u5316\u90fd\u662f\u53ef\u4ee5\u8ba1\u7b97\u5230\u7684\u3002\u518d\u4f7f\u7528\u8d1d\u5c14\u66fc\u65b9\u7a0b\uff0c\u901a\u8fc7\u672a\u6765\u7684\u72b6\u6001\u5012\u63a8\u73b0\u5728\u7684\u72b6\u6001\u3002\u7136\u540e\u4f7f\u7528Bootstrapping\u7b97\u6cd5\uff0c\u7528\u672a\u6765\u7684value\u6765\u66f4\u65b0\u73b0\u5728\u7684value\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><strong><span style=\"font-size: 13px;\">Temporal-Difference Learning\uff1a<\/span><\/strong><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u8fd9\u79cd\u7b97\u6cd5\u7ed3\u5408\u4e86\u4e0a\u8ff0\u4e24\u79cd\u65b9\u6cd5\u7684\u4f18\u70b9\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u65e2\u4e0d\u9700\u8981\u5bf9\u73af\u5883\u5efa\u6a21\uff08Model-free\uff09\uff0c\u53c8\u53ef\u4ee5\u4f7f\u7528Bootstrapping\uff0c\u62ff\u672a\u6765\u7684value\u6765\u4f30\u8ba1\u73b0\u5728\u7684value\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 13px;\">\u5728\u5b9e\u9645\u7684\u5e94\u7528\u4e2d\uff0c\u88ab\u91c7\u7528\u7684\u5927\u90e8\u5206\u7684\u7b97\u6cd5\u90fd\u662f\u57fa\u4e8eTemporal-Difference Learning\u7684\u3002\u63a5\u4e0b\u6765\u6211\u4eec\u5c31\u6765\u91cd\u70b9\u8bb2\u4e00\u4e0b\u6700\u5e38\u7528\u7684\u4e24\u79cd\u7b97\u6cd5\uff1aSARSA \u548c Q-Learning \u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\"><\/span><\/p>\n<section  class=\"mpa-template\"  
style=\"margin-left: 0.5em; margin-right: 0.5em;\">\n<section style=\"margin-top: 20px;display: -webkit-box;display: flex;-webkit-box-pack: center;justify-content: center;-webkit-box-align: center;align-items: center;\" >\n<section style=\"width: 35px;height: 35px;\" >\n<section style=\"width: 100%; height: 100%; display: flex; -webkit-box-pack: center; justify-content: center; -webkit-box-align: center; align-items: center; border-radius: 50%; border-width: 1px; border-style: solid; border-color: rgb(105, 13, 3);\" >\n<section style=\"background-color: rgb(105, 13, 3); padding: 5px; color: rgb(255, 255, 255); width: 80%; height: 80%; border-radius: 50%; font-size: 14px; line-height: 20px; text-align: center;\" >3<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px; text-align: center;\"><strong><span style=\"color: rgb(123, 12, 0);\">SARSA&amp;Q-Learning\u7b97\u6cd5<\/span><\/strong><strong style=\"font-size: 18px;\"><span style=\"color: rgb(123, 12, 0); font-size: 14px;\"><\/span><\/strong><\/p>\n<section   style=\"display: inline !important; margin-left: 0.5em; margin-right: 0.5em;\">\n<section style=\"display: inline !important;\">\n<section style=\"display: inline !important;\">\n<p><br  \/><\/p>\n<p style=\"margin-left: 0.5em; margin-right: 0.5em;\"><span style=\"font-size: 14px;\"><strong><span style=\"color: rgb(123, 12, 0);\">1\u3001SARSA &amp; Q-Learning \u7b97\u6cd5\u5f02\u540c<\/span><\/strong><\/span><\/p>\n<p style=\"margin-left: 0.5em; margin-right: 0.5em;\"><span style=\"font-size: 13px; letter-spacing: 0.5px;\"><br  \/><\/span><\/p>\n<p style=\"margin-left: 0.5em; margin-right: 0.5em;\"><span style=\"font-size: 13px; letter-spacing: 0.5px;\">\u8fd9\u4e24\u79cd\u90fd\u662f\u5bf9Q value\uff08\u5373action-value 
function\uff09\u505a\u4f30\u8ba1\uff0c\u90fd\u662f\u8fed\u4ee3\u66f4\u65b0value\u7684\u503c\u3002SARSA\uff08on-policy\uff09\uff1a<\/span><\/p>\n<p style=\"margin-left: 0.5em; margin-right: 0.5em;\"><span style=\"font-size: 13px; letter-spacing: 0.5px;\"><br  \/><\/span><\/p>\n<p style=\"margin-left: 0.5em; margin-right: 0.5em;\"><span style=\"font-size: 13px; letter-spacing: 0.5px;\">\u8fd9\u79cd\u7b97\u6cd5\u662f\u5728\u6bcf\u4e00\u6b21\u884c\u52a8\uff08Action\uff09\u540e\uff0c\u6839\u636e\u4e0b\u4e00\u523b\u7cfb\u7edf\u8bc6\u522b\u5230\u7684\u73af\u5883\u72b6\u6001\u53d8\u5316\uff08state\uff09\uff0c\u66f4\u65b0\u8fd9\u4e00\u523b\u7684value\u3002\u5373Q\u662f\u9488\u5bf9\u5f53\u524dPolicy\u7684\u3002<\/span><\/p>\n<\/section>\n<\/section>\n<\/section>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><inherit><img     style=\"height: 129px; border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: 460px;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma10-1534232145.jpg\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\">\u5bf9\u4e8eSARSA\u6765\u8bf4\uff0c\u6bcf\u6b21\u7684Training data\u662f\u8fd9\u6837\u7684\uff1a<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\">St\uff1a\u5f53\u524d\u7684\u72b6\u6001\uff1bAt\uff1a\u5f53\u524d\u7684Action\uff1bRt+1\uff1a\u8fd9\u6b21\u7684Reward\uff1bSt+1\uff1a\u4e0b\u4e00\u6b21\u7684\u72b6\u6001\uff1bAt+1\uff1a\u4e0b\u4e00\u6b21\u7684Action\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 
13px;\">\u4e4b\u6240\u4ee5\u6709At+1\uff0c\u662f\u56e0\u4e3aQ\u662fS\uff0cA\u7684\u51fd\u6570\uff0c\u5fc5\u987b\u540c\u65f6\u6709\u4e0b\u4e00\u6b65\u7684State\u548cAction\u624d\u80fd\u8ba1\u7b97\u8fd9\u4e00\u65f6\u523b\u7684Q value\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\">Q-Learning\uff08off-policy\uff09\uff1a<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\">\u8fd9\u4e2a\u7b97\u6cd5\u4e0d\u5173\u5fc3\u4e0b\u4e00\u6b65Policy\u600e\u4e48\u9009\uff0c\u76f4\u63a5\u6311\u4e00\u4e2a\u80fd\u8ba9\u4e0b\u4e00\u6b65Q\uff08S\uff0cA\uff09\u6700\u5927\u7684Action\u53bb\u505a\u66f4\u65b0\u3002\u516c\u5f0f\u4e2d\u7684maxQ(S&#8217;, a)\u5373\u4ee3\u8868\u6211\u6240\u6709\u7684action\u91cc\uff0c\u54ea\u4e00\u4e2a\u80fd\u8ba9\u4e0b\u4e00\u523b\u7684Q value\u6700\u5927\uff0c\u5c31\u7528\u5b83\u6765\u66f4\u65b0Q value\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><inherit><img     style=\"height: 125px; border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: 474px;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma1-1534232145.jpg\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\">\u5bf9\u4e8eQ-Learning\u6765\u8bf4\uff0cTraining data\u4e2d\u4e0d\u9700\u8981\u6709At+1\uff0c\u56e0\u4e3a\u4e0d\u9700\u8981\u77e5\u9053\u4e0b\u4e00\u6b65\u7684Action\u8981\u600e\u6837\u9009\u62e9\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"color: rgb(123, 12, 0);\"><strong><span style=\"font-size: 
14px;\">2\u3001\u8fd9\u8fd8\u6709\u4e2a\u5927\u95ee\u9898\uff01\u65e0\u6cd5\u7a77\u4e3e\u7684\u73b0\u5b9e\u4e16\u754c<\/span><\/strong><\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\">\u89e3\u51b3\u65b9\u6cd5\u662f\uff1a\u6211\u4eec\u4e0d\u53bb\u4f30\u8ba1\u548c\u4fdd\u5b58\u90a3\u4e48\u591a\u7684value\u548caction\uff0c\u6211\u4eec\u5efa\u7acb\u4e00\u4e2a\u6a21\u578b\u53bb\u62df\u5408value\u51fd\u6570\uff0c\u751a\u81f3\u53bb\u62df\u5408policy\u548cmodel\u3002<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><inherit><img     style=\"height: 125px; border-width: 0px; border-style: initial; border-color: initial; cursor: default; width: 498px;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma5-1534232145.png\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/inherit><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\">\u90a3\u8981\u5982\u4f55\u624d\u80fd\u505a\u5230\u51c6\u786e\u7684\u62df\u5408\uff1f\u54c8\u54c8\uff0c\u90a3\u5c31\u9700\u8981\u6df1\u5ea6\u5f3a\u5316\u5b66\u4e60\u51fa\u573a\u4e86\uff01<\/span><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px; background-color: rgb(255, 255, 255); widows: 1;\">\u5c06\u6df1\u5ea6\u795e\u7ecf\u7f51\u7edc\u4e0e\u5f3a\u5316\u5b66\u4e60\u7ed3\u5408\u7684\u6280\u672f\u6211\u4eec\u7edf\u79f0\u4e3a\u6df1\u5ea6\u5f3a\u5316\u5b66\u4e60\u3002\u5b9e\u73b0\u6df1\u5ea6\u5f3a\u5316\u5b66\u4e60\u7684\u65b9\u6cd5\u6709\u591a\u79cd\uff0c\u5176\u4e2d\u5305\u62ec\uff1a<\/span><span style=\"font-size: 13px;\"><\/span><\/p>\n<blockquote>\n<p style=\"margin: 10px 0.5em; color: rgb(62, 62, 62); font-size: 16px; white-space: normal; widows: 1; background-color: rgb(255, 255, 255); line-height: 2em; 
letter-spacing: 0.5px;\"><strong><span style=\"font-size: 13px; color: rgb(0, 0, 0);\">\u53ef\u4ee5\u8ba9\u673a\u5668\u4eba\u6253\u7535\u52a8\u6e38\u620f\u6bd4\u4eba\u7c7b\u8fd8\u5389\u5bb3\u7684\uff1aDeep Q-Network\uff08DQN\uff09\uff08\u70b9\u51fb\u9605\u8bfb\u539f\u6587\uff09\uff1b<\/span><\/strong><\/p>\n<p style=\"margin: 10px 0.5em; color: rgb(62, 62, 62); font-size: 16px; white-space: normal; widows: 1; background-color: rgb(255, 255, 255); line-height: 2em; letter-spacing: 0.5px;\"><strong><span style=\"font-size: 13px; color: rgb(0, 0, 0);\">\u4ee5\u53ca\u5e2e\u52a9 AlphaGo \u9009\u62e9\u843d\u5b50\u7b56\u7565\u7684Policy Gradient\u7b97\u6cd5\uff1b<\/span><\/strong><\/p>\n<p style=\"margin: 10px 0.5em; color: rgb(62, 62, 62); font-size: 16px; white-space: normal; widows: 1; background-color: rgb(255, 255, 255); line-height: 2em; letter-spacing: 0.5px;\"><strong><span style=\"font-size: 13px; color: rgb(0, 0, 0);\">\u8fd8\u6709\u8363\u83b7\u4eca\u5e74NIPS\u6700\u4f73\u8bba\u6587\u5956\u7684Value Iteration\u7b97\u6cd5\u3002<\/span><\/strong><\/p>\n<\/blockquote>\n<p style=\"margin: 10px 0.5em; color: rgb(62, 62, 62); font-size: 16px; white-space: normal; widows: 1; background-color: rgb(255, 255, 255); line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px; color: rgb(0, 0, 0);\">\u8fd9\u51e0\u79cd\u7b97\u6cd5\u5404\u6709\u4ec0\u4e48\u533a\u522b\uff0c\u90fd\u6709\u4ec0\u4e48\u795e\u901a\uff1f<\/span><\/p>\n<p style=\"margin: 10px 0.5em; color: rgb(62, 62, 62); font-size: 16px; white-space: normal; widows: 1; background-color: rgb(255, 255, 255); line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px; color: rgb(0, 0, 0);\"><br  \/><\/span><\/p>\n<p style=\"margin: 10px 0.5em; color: rgb(62, 62, 62); font-size: 16px; white-space: normal; widows: 1; background-color: rgb(255, 255, 255); line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px; color: rgb(0, 0, 0);\"><\/span><\/p>\n<section  
class=\"mpa-template\" >\n<section style=\"margin-top: 20px;display: -webkit-box;display: flex;-webkit-box-pack: center;justify-content: center;-webkit-box-align: center;align-items: center;\" >\n<section style=\"width: 35px;height: 35px;\" >\n<section style=\"width: 100%; height: 100%; display: flex; -webkit-box-pack: center; justify-content: center; -webkit-box-align: center; align-items: center; border-radius: 50%; border-width: 1px; border-style: solid; border-color: rgb(105, 13, 3);\" >\n<section style=\"background-color: rgb(105, 13, 3); padding: 5px; color: rgb(255, 255, 255); width: 80%; height: 80%; border-radius: 50%; font-size: 14px; line-height: 20px; text-align: center;\" >4<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<p style=\"margin: 10px 0.5em; color: rgb(62, 62, 62); font-size: 16px; white-space: normal; widows: 1; background-color: rgb(255, 255, 255); line-height: 2em; letter-spacing: 0.5px; text-align: center;\"><strong><span style=\"color: rgb(123, 12, 0);\">\u53c2\u8003\u8d44\u6599<br  \/><\/span><\/strong><\/p>\n<p style=\"margin: 10px 0.5em; color: rgb(62, 62, 62); font-size: 16px; white-space: normal; widows: 1; background-color: rgb(255, 255, 255); line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px; color: rgb(0, 0, 0);\"><br  \/><\/span><\/p>\n<p style=\"margin: 10px 0.5em; color: rgb(62, 62, 62); font-size: 16px; white-space: normal; widows: 1; background-color: rgb(255, 255, 255); line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px; color: rgb(0, 0, 0);\">\u5982\u679c\u60f3\u8981\u66f4\u8be6\u7ec6\u5730\u4e86\u89e3\u5173\u4e8e\u5f3a\u5316\u5b66\u4e60\u7684\u5185\u5bb9\uff0c\u53ef\u4ee5\u53c2\u7167\u4ee5\u4e0b\u7684\u63a8\u8350\u53c2\u8003\u6750\u6599\uff1a<\/span><\/p>\n<p style=\"margin: 10px 0.5em; color: rgb(62, 62, 62); font-size: 16px; white-space: normal; widows: 1; background-color: rgb(255, 255, 255); line-height: 2em; letter-spacing: 0.5px;\"><span 
style=\"font-size: 13px; color: rgb(0, 0, 0);\">\u9996\u5148\u63a8\u8350\u5927\u5bb6\u4e00\u672c\u5173\u4e8e\u5f3a\u5316\u5b66\u4e60\u4ecb\u7ecd\u7684\u4e66\uff1a<\/span><strong><span style=\"font-size: 13px;\">Sutton &amp; Barto.&nbsp;Reinforcement Learning: An Introduction: classic, comprehensive, plenty of examples\uff1b<\/span><\/strong><\/p>\n<p style=\"margin: 10px 0.5em; color: rgb(62, 62, 62); font-size: 16px; white-space: normal; widows: 1; background-color: rgb(255, 255, 255); line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\">\u8fd8\u6709\u4e00\u4e9b\u5173\u4e8e\u5f3a\u5316\u5b66\u4e60\u7b97\u6cd5\u7684\u4ecb\u7ecd\uff1a<\/span><strong><span style=\"font-size: 13px;\">Csaba Szepesva\u0301ri. Algorithms for Reinforcement&nbsp;Learning: concise, theoretical<\/span><\/strong><\/p>\n<p style=\"margin-top: 10px; margin-bottom: 10px; line-height: 2em; padding-left: 0.5em; padding-right: 0.5em;\"><span style=\"font-size: 13px;\">\u5173\u4e8e\u5f3a\u5316\u5b66\u4e60\u7684\u6700\u65b0\u7814\u7a76\uff1a<\/span><\/p>\n<p style=\"margin-top: 10px; margin-bottom: 10px; line-height: 2em; padding-left: 0.5em; padding-right: 0.5em;\"><strong><span style=\"font-size: 13px;\">Yuxi Li. 
Deep Reinforcement Learning: An Overview<\/span><\/strong><\/p>\n<p style=\"margin-top: 10px; margin-bottom: 10px; line-height: 2em; padding-left: 0.5em; padding-right: 0.5em;\"><span style=\"font-size: 13px;\">\u548c\u4e00\u4e9bActive researchers\uff1a<\/span><\/p>\n<p style=\"margin-top: 10px; margin-bottom: 10px; line-height: 2em; padding-left: 0.5em; padding-right: 0.5em;\"><strong><span style=\"font-size: 13px;\">Pieter Abbeel, Sergey Levine, John Schulman, David Silver, Timothy Lillicrap, Volodymyr Mnih, Shixiang Gu&nbsp;<\/span><\/strong><\/p>\n<p style=\"margin: 10px 0.5em; color: rgb(62, 62, 62); font-size: 16px; white-space: normal; widows: 1; background-color: rgb(255, 255, 255); line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\">\u5f53\u7136\u5982\u679c\u4f60\u60f3\u4ee5\u4e00\u79cd\u66f4\u6709\u8da3\u7684\u65b9\u5f0f\u6765\u4e86\u89e3\u5f3a\u5316\u5b66\u4e60\uff0c\u8bf7\u67e5\u770b\u6765\u81ea<strong>\u6fb3\u6d32\u683c\u91cc\u83f2\u65af\u5927\u5b66\u5728\u8bfb\u535a\u58eb\u751f\u83ab\u70e6\u7684\u300a\u5f3a\u5316\u5b66\u4e60\u4ecb\u7ecd\u7cfb\u5217\u300b\u3002<\/strong><\/span><\/p>\n<p style=\"margin: 10px 0.5em; color: rgb(62, 62, 62); font-size: 16px; white-space: normal; widows: 1; text-align: left; background-color: rgb(255, 255, 255); line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px;\">http:\/\/campus.swarma.org\/gpac=16#src=2<\/span><img      src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma1-1534232145-1.jpg\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/p>\n<p style=\"margin: 10px 0.5em; white-space: normal; letter-spacing: 0.5px; line-height: 2em;\"><span style=\"font-size: 
13px;\">\u6700\u540e\uff0c\u6211\u518d\u7ed9\u5927\u5bb6\u5b89\u5229\u4e00\u95e8<strong>\u76f4\u64ad<\/strong>\u7684\u8bfe\u7a0b\uff0c\u4f5c\u4e3a\u8bfe\u7a0b\u8d28\u91cf\u62c5\u5f53\u7684\u201c\u5c0fS\u201d\u7684\u674e\u5ae3\u7136\u53c8\u4e00\u6b21\u5728\u96c6\u667a\u4ff1\u4e50\u90e8\u5f00\u8bfe\uff0c\u624b\u628a\u624b\u6559\u5927\u5bb6\u5982\u4f55\u6253\u9020\u81ea\u5df1\u7684\u804a\u5929\u673a\u5668\u4eba\u3002<\/span><img      src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma4-1534232146.jpeg\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><br  \/><\/p>\n<section style=\"white-space: normal; margin-left: 0.5em; margin-right: 0.5em; letter-spacing: 0.5px;\">\n<section style=\"letter-spacing: 0.5px; margin-left: 0.5em; margin-right: 0.5em;\">\n<section  style=\"letter-spacing: 0.5px; margin-left: 0.5em; margin-right: 0.5em;\">\n<p style=\"margin: 10px 0.5em; line-height: 2em; letter-spacing: 0.5px;\"><span style=\"font-size: 13px; letter-spacing: 0.5px;\"><\/span><br  \/><\/p>\n<p style=\"margin: 10px 0.5em; line-height: 2em; letter-spacing: 0.5px; text-align: center;\"><strong><span style=\"color: rgb(123, 12, 0);\">\u63a8\u8350\u9605\u8bfb<\/span><\/strong><\/p>\n<p style=\"letter-spacing: 0.5px; white-space: normal; text-align: center;\"><br  \/><\/p>\n<p style=\"letter-spacing: 0.5px; white-space: normal; text-align: center; margin-top: 10px;\"><a href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247485881&amp;idx=1&amp;sn=5b7aff8a4e824bdbe64f6d6e488dd61b&amp;chksm=e8945334dfe3da22bd31c3cc83f9b1ca25521fa30f6ba3bec28fbcacd69282e769a4da1564cd&amp;scene=21#wechat_redirect\" target=\"_blank\" style=\"text-decoration: underline; font-size: 13px;\">\u91cd\u78c5\u8bfe\u7a0b\uff1a\u6253\u9020\u4f60\u81ea\u5df1\u7684\u804a\u5929\u673a\u5668\u4eba | \u674e\u5ae3\u7136<\/a><br  \/><\/p>\n<p style=\"letter-spacing: 0.5px; white-space: normal; text-align: center; margin-top: 10px;\"><a 
href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247485862&amp;idx=1&amp;sn=e9485916dcb7a3b4b623fe6da6d30dfe&amp;chksm=e894532bdfe3da3d530e70f8a95d25cf8d61a348cd058de71296e82df910f85cb4b6df739a59&amp;scene=21#wechat_redirect\" target=\"_blank\" style=\"text-decoration: underline; font-size: 13px;\">\u5982\u4f55\u653b\u7834\u8bed\u97f3\u8bc6\u522b\u6700\u540e\u76843%\uff1f | \u8bfb\u4e66\u4f1a<\/a><br  \/><\/p>\n<p style=\"white-space: normal; text-align: center; margin-top: 10px;\"><a href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247485855&amp;idx=1&amp;sn=e546a3f6023d90909a9ac9a3d3b4658f&amp;chksm=e8945312dfe3da04d4633aed4a4d1f9770a710ef76fc0349fdb2a8b458e56ea72804103b5b7d&amp;scene=21#wechat_redirect\" target=\"_blank\" style=\"text-decoration: underline; font-size: 13px;\"><span style=\"font-size: 13px;\">\u4ece\u4e07\u7269\u6709\u7075\u5230AI\u638c\u7ba1\u4e16\u754c\u2014\u2014AI\u89c6\u91ce\uff08\u4e09\uff09<\/span><\/a><\/p>\n<p style=\"white-space: normal; text-align: center; margin-top: 10px;\"><a href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247485723&amp;idx=1&amp;sn=ef60e683e1d9377f0ebc583d761a0066&amp;chksm=e8945396dfe3da808b84c9dcafe65c02920b77847ed3831066a376c01112de6777a476a3de2e&amp;scene=21#wechat_redirect\" target=\"_blank\" style=\"text-decoration: underline; font-size: 13px;\"><span style=\"font-size: 13px;\">\u900f\u89c6\u6df1\u5ea6\u5b66\u4e60\uff0c\u7545\u60f3\u672a\u6765\u5e94\u7528\u2014\u2014AI\u89c6\u91ce\uff08\u4e8c\uff09<\/span><\/a><br  \/><\/p>\n<p style=\"white-space: normal; text-align: center; margin-top: 10px;\"><a href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247485677&amp;idx=1&amp;sn=c87541996d9f734390b9c6b2ab9abde5&amp;chksm=e8945260dfe3db76d5839523786f649d4fe7222f7f2a3a35be5775e3dc8d032a4bffb1544eeb&amp;scene=21#wechat_redirect\" target=\"_blank\" style=\"text-decoration: underline; font-size: 13px;\"><span style=\"font-size: 
13px;\">\u63ea\u7740\u81ea\u5df1\u7684\u5934\u53d1\u79bb\u5f00\u5730\u7403\u2014\u2014AI\u89c6\u91ce\uff08\u4e00\uff09<\/span><\/a><\/p>\n<p style=\"letter-spacing: 0.5px; white-space: normal; text-align: center; margin-top: 10px;\"><a href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247485818&amp;idx=2&amp;sn=e1ee216064c0067b8dd4197fd84469d7&amp;chksm=e89453f7dfe3dae1c6de34769ac00479969066c9e65a0d2fb71ef4cf9af8c3bbe6676c06912d&amp;scene=21#wechat_redirect\" target=\"_blank\" style=\"text-decoration: underline; font-size: 13px;\"><span style=\"font-size: 13px;\">AI\u6253\u6e38\u620f\u80cc\u540e\u7684\u6280\u672f\u539f\u7406&nbsp;<\/span><\/a><br  \/><\/p>\n<p style=\"letter-spacing: 0.5px; white-space: normal; text-align: center; margin-top: 10px;\"><a href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247485777&amp;idx=1&amp;sn=66a908e6a0f4cd31afaa698cdd743391&amp;chksm=e89453dcdfe3daca0106b235f3a42b8e99bcf08fa469f525fe7473a74d9768803a0d8b93da0a&amp;scene=21#wechat_redirect\" target=\"_blank\" style=\"text-decoration: underline; font-size: 13px;\"><span style=\"font-size: 13px;\">\u770bAlphaGo\u8650\u67ef\u6d01\u4e0d\u723d\uff1f \u90a3\u5c31\u89e3\u5256\u5b83\u4eb2\u54e5\uff01<\/span><\/a><br  \/><\/p>\n<p style=\"letter-spacing: 0.5px; white-space: normal; text-align: center; margin-top: 10px;\"><a href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247485769&amp;idx=1&amp;sn=17928ec512da74b250e356ccba25a750&amp;chksm=e89453c4dfe3dad2a9bc7d73f9957379b15a61ef77c6a4d8b5d680b88cef22f51329ffb13a31&amp;scene=21#wechat_redirect\" target=\"_blank\" style=\"text-decoration: underline; font-size: 13px;\"><span style=\"font-size: 13px;\">\u67ef\u6d01\u8f93\u4e86\uff0c\u6240\u4ee5\u6765\u5b66\u5b66AlphaGo\u80cc\u540e\u7684\u4eba\u5de5\u667a\u80fd<\/span><\/a><\/p>\n<p style=\"letter-spacing: 0.5px; white-space: normal;\"><br  \/><\/p>\n<hr style=\"margin-right: 0.5em; margin-left: 0.5em; white-space: normal; line-height: 
25.6px; letter-spacing: 0.5px;\"  \/>\n<p style=\"margin-right: 0.5em; margin-left: 0.5em; white-space: normal; line-height: 25.6px; text-align: center; letter-spacing: 0.5px;\"><img width=\"100%\" class=\"__bg_gif\"     style=\"color: rgb(62, 62, 62); font-size: 16px; background-color: rgb(255, 255, 255); visibility: visible !important; width: 64px !important;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma5-1534232146.gif\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/p>\n<section   style=\"margin-right: 0.5em; margin-left: 0.5em; font-size: 16px; white-space: normal; line-height: 25.6px; color: rgb(62, 62, 62); letter-spacing: 0.5px; background-color: rgb(255, 255, 255);\">\n<section   style=\"margin-right: 0.5em; margin-left: 0.5em; line-height: 25.6px; text-align: center; outline: none;\">\n<section   style=\"margin-right: 0.5em; margin-left: 0.5em; line-height: 25.6px; outline: none;\">\n<section   style=\"outline: none;\">\n<section  style=\"margin-right: 0.5em; margin-left: 0.5em; font-size: 15px; outline: none;\">\n<section  style=\"line-height: 25.6px; border-color: rgb(123, 12, 0);\">\n<p style=\"margin-top: 10px; margin-bottom: 10px; padding-right: 3px; padding-left: 3px; transform: translate3d(0px, 0px, 0px); border-color: rgb(123, 12, 0); line-height: 1.5em;\"><strong><span style=\"font-size: 12px; color: rgb(136, 136, 136);\">\u96c6\u667aQQ\u7fa4\uff5c292641157<br  \/>\u5546\u52a1\u5408\u4f5c\uff5czhangqian@swarma.org<br  \/>\u6295\u7a3f\u8f6c\u8f7d\uff5cwangting@swarma.org<\/span><\/strong><\/p>\n<section   style=\"margin-right: 0.5em; margin-left: 0.5em; outline: none;\">\n<h1 style=\"margin-top: 10px; margin-bottom: 10px; line-height: 1.75em;\"><strong style=\"font-size: 14px; white-space: pre-wrap; color: rgb(0, 112, 192); line-height: 25.6px;\"><strong style=\"line-height: 28px; white-space: normal; color: rgb(61, 170, 214); font-size: 20px;\"><span style=\"font-size: 14px; color: rgb(136, 136, 136);\"><span 
style=\"color: rgb(255, 76, 0);\">\u25c6&nbsp;<\/span><span style=\"color: rgb(0, 128, 255);\">\u25c6&nbsp;<\/span><span style=\"color: rgb(61, 170, 214);\">\u25c6<\/span><\/span><\/strong><\/strong><\/h1>\n<\/section>\n<p style=\"margin-right: 0.5em; margin-left: 0.5em; font-size: 19px; font-family: \u5fae\u8f6f\u96c5\u9ed1; color: rgb(71, 193, 168); line-height: 23.2727px; overflow-wrap: break-word !important;\"><span style=\"color: rgb(123, 12, 0);\"><strong><span style=\"font-size: 14px;\">\u641c\u7d22\u516c\u4f17\u53f7\uff1a\u96c6\u667a\u4ff1\u4e50\u90e8<\/span><\/strong><\/span><\/p>\n<p style=\"margin-right: 0.5em; margin-left: 0.5em; font-size: 19px; font-family: \u5fae\u8f6f\u96c5\u9ed1; color: rgb(71, 193, 168); line-height: 23.2727px; overflow-wrap: break-word !important;\"><span style=\"color: rgb(0, 0, 0);\"><strong><span style=\"font-size: 14px;\"><br  \/><\/span><\/strong><\/span><\/p>\n<p style=\"margin-right: 0.5em; margin-left: 0.5em; font-size: 19px; font-family: \u5fae\u8f6f\u96c5\u9ed1; color: rgb(71, 193, 168); line-height: 23.2727px; overflow-wrap: break-word !important;\"><span style=\"color: rgb(0, 0, 0);\"><strong><span style=\"font-size: 14px;\">\u52a0\u5165\u201c\u6ca1\u6709\u56f4\u5899\u7684\u7814\u7a76\u6240\u201d<\/span><\/strong><\/span><\/p>\n<section style=\"margin-right: 0.5em; margin-left: 0.5em; font-size: 14px; color: rgb(71, 193, 168); line-height: 20px; overflow-wrap: break-word !important;\">\n<p style=\"margin: 5px auto; padding: 10px; width: 180px; border-width: 2px; border-style: dashed; border-color: rgb(132, 132, 132); line-height: normal; overflow-wrap: break-word !important;\"><img width=\"auto\"      style=\"overflow-wrap: break-word !important; visibility: visible !important; width: auto !important;\" src=\"http:\/\/swarma.org\/wp-content\/uploads\/2018\/08\/swarma1-1534232146.jpeg\" alt=\"\u96c6\u667a\" title=\"\u96c6\u667a\"  \/><\/p>\n<\/section>\n<p><span style=\"font-size: 
14px;\">\u8ba9\u82f9\u679c\u7838\u5f97\u66f4\u731b\u70c8\u4e9b\u5427\uff01<\/span><\/p>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<blockquote class='keep-source'>\n<p>\u59cb\u53d1\u4e8e\u5fae\u4fe1\u516c\u4f17\u53f7\uff1a                         \u96c6\u667a\u4ff1\u4e50\u90e8                      <\/p>\n<\/blockquote>\n<\/div>\n","protected":false},"excerpt":{"rendered":"<p>\u5bfc\u8bed \u524d\u4e9b\u65e5\u5b50AlphaGo\u4ee5\u4e00\u201c\u4eba\u201d\u4e4b\u529b\u6a2a\u626b\u4e86\u56fd\u5185\u51e0\u5927\u9876\u5c16\u56f4\u68cb\u9ad8\u624b\u7684\u4e8b\u60c5\uff0c\u76f8\u4fe1\u5728\u6c5f\u6e56\u4e0a\u5df2\u7ecf\u65e0\u4eba\u4e0d\u77e5\u65e0\u4eba\u4e0d\u6653\u4e86\u3002 \u65b0\u95fb\u4e4b\u5916\uff0c\u5982\u679c\u4f60\u5bf9AlphaGo\u7684\u5b9e\u73b0\u6280\u672f\u611f\u5174\u8da3\uff0c\u76f8\u4fe1\u4f60\u4e5f\u5df2\u7ecf\u542c\u8bf4\u8fc7\u201c\u5f3a\u5316\u5b66\u4e60\u201d\u4e86\u3002 AlphaGo\u662f\u4e2a\u5927\u5de5\u7a0b\uff0c\u9664\u4e86\u201c\u5f3a\u5316\u5b66\u4e60\u201d\uff0c\u8fd8\u5229\u7528\u4e86\u201c\u8499\u7279\u5361\u6d1b\u6811\u641c\u7d22\u201d\u7b49\u591a\u79cd\u6280\u672f\uff0c\u4eca\u5929\u6211\u4eec\u4e0d\u53bb\u8bb2\u8fd9\u4e9b&#8230;<\/p>\n","protected":false},"author":1,"featured_media":4740,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":[],"categories":[19],"tags":[],"special":[],"_links":{"self":[{"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/posts\/4739"}],"collection":[{"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=4739"}],"version-history":[{"count":1,"href":"https:\/\/swarma.org\/index.php?
rest_route=\/wp\/v2\/posts\/4739\/revisions"}],"predecessor-version":[{"id":4768,"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/posts\/4739\/revisions\/4768"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/media\/4740"}],"wp:attachment":[{"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=4739"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=4739"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=4739"},{"taxonomy":"special","embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Fspecial&post=4739"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}