{"id":48027,"date":"2024-01-26T17:48:26","date_gmt":"2024-01-26T09:48:26","guid":{"rendered":"https:\/\/swarma.org\/?p=48027"},"modified":"2024-01-26T17:48:26","modified_gmt":"2024-01-26T09:48:26","slug":"yoshua-bengio%e6%bc%94%e8%ae%b2%e3%80%81neurips%e5%af%b9%e9%bd%90%e5%b7%a5%e4%bd%9c%e5%9d%8a%ef%bc%9a%e9%81%bf%e5%85%8dai%e7%81%be%e9%9a%be%e6%80%a7%e9%a3%8e%e9%99%a9%e7%9a%84%e6%8a%80%e6%9c%af","status":"publish","type":"post","link":"https:\/\/swarma.org\/?p=48027","title":{"rendered":"Yoshua Bengio\u6f14\u8bb2\u3001NeurIPS\u5bf9\u9f50\u5de5\u4f5c\u574a\uff1a\u907f\u514dAI\u707e\u96be\u6027\u98ce\u9669\u7684\u6280\u672f\u4e0e\u534f\u8c03\u6311\u6218"},"content":{"rendered":"<div class='wxsyncmain'>\n<section data-tool=\"mdnice\u7f16\u8f91\u5668\" data-website=\"https:\/\/www.mdnice.com\" data-mpa-powered-by=\"yiban.io\">\n<section powered-by=\"xiumi.us\">\n<section>\n<section powered-by=\"xiumi.us\">\n<section powered-by=\"xiumi.us\" style=\"margin-bottom: 0px;outline: 0px;letter-spacing: 0.544px;white-space: normal;color: rgb(63, 63, 63);font-family: PingFangSC-light;font-size: 15px;background-color: rgb(255, 255, 255);visibility: visible;\">\n<section style=\"outline: 0px;display: inline-block;width: 661px;vertical-align: top;background-color: rgb(246, 246, 246);visibility: visible;\">\n<section style=\"outline: 0px;visibility: visible;\">\n<p style=\"outline: 0px;text-align: center;visibility: visible;\"><img class=\"rich_pages wxw-img\" data-backh=\"246\" data-backw=\"578\" data-imgfileid=\"100198328\" data-ratio=\"0.425\"  data-w=\"1080\" style=\"width: 100%;height: auto;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-252506594372d69de8bbd3e7f998b5f0.jpeg\"  \/><\/p>\n<\/section>\n<section powered-by=\"xiumi.us\" style=\"margin-top: 10px;outline: 0px;letter-spacing: 0.544px;visibility: visible;\">\n<section style=\"outline: 0px;width: 661px;visibility: visible;\">\n<section style=\"padding-right: 3px;outline: 0px;float: left;line-height: 
1;visibility: visible;\">\n<section powered-by=\"xiumi.us\" style=\"outline: 0px;text-align: left;visibility: visible;\">\n<section style=\"padding-left: 10px;outline: 0px;display: inline-block;width: auto;vertical-align: top;min-width: 10%;height: auto;border-left: 3px solid rgb(33, 166, 210);border-bottom-left-radius: 0px;line-height: 0;visibility: visible;\">\n<section powered-by=\"xiumi.us\" style=\"outline: 0px;transform: translate3d(-13px, 0px, 0px);visibility: visible;\">\n<section style=\"outline: 0px;display: inline-block;width: 25px;height: 10px;vertical-align: top;overflow: hidden;line-height: 0;border-style: solid solid none;border-width: 3px 3px 2px;border-radius: 0px;border-color: rgb(33, 166, 210) rgb(33, 166, 210) rgb(15, 76, 129);visibility: visible;\"><br style=\"outline: 0px;visibility: visible;\"  \/><\/section>\n<\/section>\n<section powered-by=\"xiumi.us\" style=\"outline: 0px;transform: translate3d(-1px, 0px, 0px);visibility: visible;\">\n<section style=\"outline: 0px;text-align: justify;color: rgb(33, 166, 210);font-size: 16px;line-height: 1.5;visibility: visible;\">\n<p style=\"outline: 0px;visibility: visible;\"><strong style=\"outline: 0px;visibility: visible;\">\u5bfc\u8bed<\/strong><\/p>\n<\/section>\n<\/section>\n<section powered-by=\"xiumi.us\" style=\"outline: 0px;transform: translate3d(-13px, 0px, 0px) rotateX(180deg);visibility: visible;\">\n<section style=\"outline: 0px;display: inline-block;width: 24px;height: 10px;vertical-align: top;overflow: hidden;line-height: 0;border-style: solid solid none;border-width: 3px 3px 2px;border-radius: 0px;border-color: rgb(33, 166, 210) rgb(33, 166, 210) rgb(15, 76, 129);visibility: visible;\"><br style=\"outline: 0px;visibility: visible;\"  \/><\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<section style=\"padding-right: 4px;padding-left: 4px;outline: 0px;clear: right;box-shadow: rgb(0, 0, 0) 0px 0px 0px;visibility: visible;min-height: 4.5em !important;\">\n<section 
powered-by=\"xiumi.us\" style=\"margin-top: 5px;margin-bottom: 5px;outline: 0px;visibility: visible;\">\n<section style=\"padding-right: 8px;padding-left: 8px;outline: 0px;font-size: 13px;line-height: 2;letter-spacing: 0.544px;visibility: visible;\">\n<p style=\"outline: 0px;clear: none;line-height: 2em;visibility: visible;\"><strong style=\"text-indent: 0em;letter-spacing: 0.578px;font-size: 15px;\"><span style=\"font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;font-size: 13px;letter-spacing: 0.544px;text-decoration-style: solid;text-decoration-color: rgb(63, 63, 63);\">\u5728 2023 \u5e74 12 \u6708\uff0c\u7b2c\u4e8c\u5c4a AI \u5bf9\u9f50\u5de5\u4f5c\u574a\uff08Alignment Workshop\uff09\u5728\u65b0\u5965\u5c14\u826f\u7684 NeurIPS \u4f1a\u8bae\u671f\u95f4\u4e3e\u529e\u3002\u672c\u6b21\u5de5\u4f5c\u574a\u662f\u7531 Adam Gleave \u9886\u5bfc\u7684\u975e\u76c8\u5229\u6027\u7814\u7a76\u673a\u6784 FAR AI \u4e3b\u529e\u3002<\/span><\/strong><\/p>\n<p style=\"outline: 0px;clear: none;line-height: 2em;visibility: visible;\"><strong style=\"letter-spacing: 0.578px;text-indent: 0em;font-size: 15px;\"><span style=\"font-size: 13px;letter-spacing: 0.544px;text-decoration-style: solid;text-decoration-color: rgb(63, 63, 63);\"><br  \/><\/span><\/strong><\/p>\n<p style=\"outline: 0px;clear: none;line-height: 2em;visibility: visible;\"><strong style=\"letter-spacing: 0.578px;text-indent: 0em;font-size: 15px;\"><span style=\"font-size: 13px;letter-spacing: 0.544px;text-decoration-style: solid;text-decoration-color: rgb(63, 63, 63);\">\u5de5\u4f5c\u574a\u9080\u8bf7\u5230\u4e86\u6765\u81ea\u5de5\u4e1a\u754c\u548c\u5b66\u672f\u754c150\u4f59\u4f4dAI\u7814\u7a76\u8005\u5c31 AI 
\u5b89\u5168\u548c\u5bf9\u9f50\u76f8\u5173\u7684\u7814\u7a76\u4e3b\u9898\u5c55\u5f00\u8ba8\u8bba\u548c\u8fa9\u8bba\uff0c\u4ece\u800c\u66f4\u597d\u5730\u7406\u89e3\u524d\u6cbf AI \u53ef\u80fd\u5e26\u6765\u7684\u98ce\u9669\uff0c\u5e76\u5bfb\u627e\u964d\u4f4e\u8fd9\u4e9b\u98ce\u9669\u7684\u7b56\u7565\u3002\u5de5\u4f5c\u574a\u7684\u8bb2\u8005\u548c\u53c2\u4e0e\u8005\u6709\u6765\u81eaOpenAI\u3001Anthropic\u3001Google DeepMind\u7b49\u9876\u5c16\u4e1a\u754cAI\u5b9e\u9a8c\u5ba4\u7684AGI\u5b89\u5168\u56e2\u961f\u6210\u5458\uff0c\u4e5f\u6709\u6765\u81eaMIT\u3001UC Berkeley\u3001CMU\u3001\u5251\u6865\u5927\u5b66\u3001\u725b\u6d25\u5927\u5b66\u3001Mila\u7b49\u9876\u5c16\u9ad8\u6821\u7684\u5b66\u8005\u3002\u56fe\u7075\u5956\u5f97\u4e3bYoshua Bengio\u5728\u5de5\u4f5c\u574a\u4e0a\u505a\u4e86\u4e3b\u65e8\u6f14\u8bb2\u3002<\/span><\/strong><\/p>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<section powered-by=\"xiumi.us\" style=\"margin-top: 10px;outline: 0px;\">\n<section style=\"outline: 0px;width: 661px;\">\n<section style=\"outline: 0px;clear: both;line-height: 0;\">\n<section style=\"outline: 0px;line-height: 0;width: 0px;\"><svg viewbox=\"0 0 1 1\" style=\"vertical-align:top;\"><\/svg><\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<section powered-by=\"xiumi.us\" style=\"margin-top: 10px;margin-bottom: 10px;outline: 0px;letter-spacing: 0.544px;white-space: normal;color: rgb(63, 63, 63);font-family: PingFangSC-light;font-size: 15px;background-color: rgb(255, 255, 255);text-align: center;\">\n<section style=\"outline: 0px;vertical-align: middle;display: inline-block;line-height: 0;\"><img class=\"rich_pages wxw-img\" data-fileid=\"100098753\" data-imgfileid=\"100198326\" data-ratio=\"0.07314814814814814\"  data-type=\"png\" data-w=\"1080\" style=\"outline: 0px;vertical-align: middle;visibility: visible !important;width: 677px !important;\" 
src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-6f9f672988af7db277f019eec3e6e952.png\"  \/><\/section>\n<\/section>\n<section powered-by=\"xiumi.us\" style=\"margin-top: 0pt;margin-bottom: 0pt;outline: 0px;letter-spacing: 0.544px;white-space: normal;line-height: 1.7;font-family: PingFangSC-light;background-color: rgb(255, 255, 255);text-align: right;\">\n<p style=\"outline: 0px;color: rgb(73, 73, 73);font-size: 14.6667px;letter-spacing: 0.544px;visibility: visible;\"><span style=\"outline: 0px;letter-spacing: 0.544px;visibility: visible;font-size: 13px;text-decoration-style: solid;text-decoration-color: rgb(73, 73, 73);\">\u5b89\u8fdcAI<\/span><span style=\"outline: 0px;letter-spacing: 0.544px;font-size: 13px;visibility: visible;\"><strong style=\"outline: 0px;color: rgb(0, 0, 0);visibility: visible;\">&nbsp;| \u6765\u6e90<\/strong><\/span><strong style=\"outline: 0px;font-size: 13px;letter-spacing: 0.544px;color: rgb(0, 0, 0);visibility: visible;\"><\/strong><\/p>\n<p style=\"outline: 0px;font-size: 14.6667px;letter-spacing: 0.544px;visibility: visible;\"><br  \/><\/p>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><br  \/><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013524\" data-ratio=\"0.600925925925926\"  data-type=\"jpeg\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;width: 412px;height: 248px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-f4bec5191f108afdcd502f5dd8bb3df0.jpeg\"  \/><\/p>\n<p style=\"margin-bottom: 0px;margin-left: 8px;margin-right: 8px;text-align: center;line-height: 1.5em;\"><span style=\"color: rgb(136, 136, 136);font-size: 
13px;\">\u65b0\u5965\u5c14\u826f\u5bf9\u9f50\u5de5\u4f5c\u574a\uff08New Orleans Alignment Workshop\uff09<\/span><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u6574\u4e2a\u5de5\u4f5c\u574a\u6309\u7167AGI\u5b89\u5168\u7684\u7814\u7a76\u65b9\u5411\u5206\u6210\u4e86\u4e94\u4e2a\u4e3b\u9898\uff1a\u5bf9\u9f50\u95ee\u9898\u5bfc\u8bba<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Introducing Alignment Problems\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3001\u76d1\u7763<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Oversight\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3001\u9c81\u68d2\u6027\u548c\u6cdb\u5316<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Robustness and Generalization\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3001\u53ef\u89e3\u91ca\u6027<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Interpretability\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3001\u6cbb\u7406<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Governance\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\uff0c\u4ee5\u4e0b\u662f\u6240\u6709\u8bb2\u8005\u4e0e\u6f14\u8bb2\u4e3b\u9898\u4e00\u89c8<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08\u52a0\u7c97\u4e3a\u957f\u6f14\u8bb2\uff0c\u5176\u4f59\u4e3a\u77ed\u6f14\u8bb2\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\uff1a<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span 
style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013525\" data-ratio=\"0.6305555555555555\"  data-type=\"png\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-acac417b48c4c8b09d051c538564624b.png\"  \/><figcaption><\/figcaption><\/figure>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013527\" data-ratio=\"0.4324074074074074\"  data-type=\"png\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-a46a7af8f9ce3ab356f4ca11ac8a9d54.png\"  \/><figcaption><\/figcaption><\/figure>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013526\" data-ratio=\"0.6555555555555556\"  data-type=\"png\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-2e230a266b8dcc6c4080806758fe4e31.png\"  \/><\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><br  \/><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u5b89\u8fdc AI 
\u7684\u6280\u672f\u9879\u76ee\u7ecf\u7406\u6bb5\u96c5\u6587\u53d7\u9080\u53c2\u4e0e\u4e86\u672c\u6b21\u5de5\u4f5c\u574a\u3002\u672c\u6587\u662f\u5de5\u4f5c\u574a\u603b\u7ed3\u7cfb\u5217\u63a8\u6587\u7684\u7b2c\u4e00\u7bc7\u6587\u7ae0\uff0c\u603b\u7ed3\u4e86\u6765\u81eaYoshua Bengio<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Mila\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3001Adam Gleave<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08FAR AI\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u548cOwain Evans<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Oxford\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u7684\u4e3b\u65e8\u6f14\u8bb2\u3002<\/span><\/section>\n<section style=\"vertical-align: inherit;margin-bottom: 0px;\"><br  \/><\/section>\n<p style=\"vertical-align:inherit;\"><br  \/><\/p>\n<section data-role=\"splitline\" data-tools=\"135\u7f16\u8f91\u5668\" data-id=\"116888\">\n<section style=\"margin: 20px auto;\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100198335\" data-ratio=\"0.035849056603773584\"  data-type=\"png\" data-w=\"530\" data-width=\"100%\" style=\"vertical-align: inherit;width: 100%;display: block;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-d4dc3d8a9371503dc8b186be22ed3958.png\"  \/><\/section>\n<\/section>\n<h1 data-tool=\"mdnice\u7f16\u8f91\u5668\" style=\"line-height: 1.75em;margin-left: 8px;margin-right: 8px;margin-bottom: 0px;\"><strong><span style=\"font-size: 15px;color: rgb(33, 166, 210);\">PART 1 \u4e3b\u65e8\u6f14\u8bb2 &#8211; Yoshua Bengio: Towards Quantitative Safety Guarantees and Alignment<\/span><\/strong><\/h1>\n<section style=\"margin-bottom: 0px;\"><br  \/><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100198337\" data-ratio=\"0.28055555555555556\"  data-type=\"png\" data-w=\"1080\" 
style=\"margin-right: auto;margin-left: auto;font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;font-size: var(--articleFontsize);letter-spacing: 0.034em;white-space: normal;display: block;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-7f2ef1722d9ad1a62709eddf14fbd73c.png\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">Yoshua Bengio: Towards Quantitative Safety Guarantees and Alignment<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u5173\u4e8e\u4ec0\u4e48\uff1a\u6df1\u5ea6\u5b66\u4e60\u4e09\u5de8\u5934\u4e4b\u4e00\u3001\u56fe\u7075\u5956\u5f97\u4e3b Yoshua Bengio \u5728\u5de5\u4f5c\u574a\u53d1\u8868\u4e86\u4e3b\u65e8\u6f14\u8bb2\uff0c\u8bb2\u8ff0\u4e86\u4ed6\u5bf9AI\u98ce\u9669\u7684\u6700\u65b0\u7814\u5224\u548c\u4ed6\u6b63\u5728\u5b9e\u8df5\u7684AI\u5b89\u5168\u6280\u672f\u65b9\u5411 &#8211; \u201c\u968f\u7740\u7b97\u529b\u589e\u52a0\u800c\u589e\u5f3a\u7684\u5b89\u5168\u4fdd\u8bc1\u201d\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span 
style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u98ce\u9669\u7814\u5224\uff1aBengio\u8ba4\u4e3a\u5f53\u524d\u907f\u514dAI\u707e\u96be\u6027\u98ce\u9669\u81f3\u5c11\u5b58\u5728\u4e24\u4e2a\u6311\u6218\uff1a\uff081\uff09\u89e3\u51b3\u5bf9\u9f50\u4e0e\u63a7\u5236\u6311\u6218\uff1a\u4e00\u4e2a\u6280\u672f\u6311\u6218+\u653f\u6cbb\u6311\u6218\uff08\u9700\u8981\u5927\u91cf\u7684\u5b89\u5168\u9886\u57df\u7684\u7814\u53d1\u6295\u8d44\uff09\uff1b\uff082\uff09\u89e3\u51b3\u534f\u8c03\u6311\u6218\uff1a\u786e\u4fddAI\u7814\u53d1\u8005\u9075\u5faa\u5b89\u5168\u548c\u4f26\u7406\u534f\u8bae\uff0c\u5e76\u4e14\u505a\u51fa\u5e94\u5bf9\u5931\u63a7AI\u7684\u51c6\u5907\u63aa\u65bd\uff0c\u540c\u65f6\u4e5f\u662f\u4e00\u4e2a\u793e\u4f1a\u6280\u672f\u6311\u6218\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013528\" data-ratio=\"0.5625\"  data-type=\"png\" data-w=\"960\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;width: 441px;height: 248px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-a8515b90ff6bc6a81242c8097c9860f5.png\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">\u907f\u514dAI\u707e\u96be\u6027\u98ce\u9669\u7684\u4e24\u4e2a\u6311\u6218<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 
8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">Bengio\u7684\u6f14\u8bb2\u524d\u534a\u90e8\u5206\u4e3b\u8981\u8bb2\u8ff0\u4e86\u5982\u4f55\u4ece\u6cbb\u7406\u7684\u89c6\u89d2\u89e3\u51b3\u534f\u8c03\u6311\u6218\uff0c\u800c\u540e\u534a\u90e8\u5206\u8bb2\u8ff0\u4e86\u9488\u5bf9\u6280\u672f\u6311\u6218\u7684\u89e3\u51b3\u65b9\u6848\uff0c\u672c\u6587\u5c06\u96c6\u4e2d\u8ba8\u8bba\u6280\u672f\u6311\u6218\u7684\u90e8\u5206\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u98ce\u9669\u6a21\u578b\uff1aBengio\u5728\u8bb2\u5ea7\u4e2d\u5f3a\u8c03\u7684\u98ce\u9669\u6a21\u578b\u4e3b\u8981\u662f\u5956\u52b1\u7834\u89e3<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08reward hacking\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3002\u5047\u8bbe\u6a21\u578b\u4f30\u8ba1\u4e86\u4e00\u4e2a\u4e0d\u5b8c\u7f8e\u7684\u5956\u52b1\u51fd\u6570\uff0c\u5e76\u57fa\u4e8e\u5f3a\u5316\u5b66\u4e60\u7684\u65b9\u6cd5\u5bf9\u5176\u8fdb\u884c\u4f18\u5316\uff0c\u6a21\u578b\u4f1a\u66f4\u6709\u53ef\u80fd\u627e\u5230\u66f4\u5927\u7684\u771f\u5b9e\u5956\u52b1\u51fd\u6570\u548c\u4f30\u8ba1\u5956\u52b1\u51fd\u6570\u7684\u4e0d\u540c<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08mismatch\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013530\" data-ratio=\"0.5583333333333333\"  
data-type=\"png\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;width: 402px;height: 224px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-286dab732cbdbfd18980f124c2342d93.png\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">\u5f3a\u5316\u5b66\u4e60\uff08RL\uff09\u5bfc\u81f4\u7684\u5bf9\u9f50\u5931\u8d25<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u5f53\u524d\u7684\u8303\u5f0f\u7684\u7f3a\u9677\u5728\u4e8e\uff1a\u6a21\u578b\u80fd\u529b\u8d8a\u5f3a\uff0c\u6a21\u578b\u8fdb\u884c\u5956\u52b1\u7834\u89e3\u9020\u6210\u707e\u96be\u7684\u80fd\u529b\u4f1a\u8d8a\u5f3a\u3002\u4e3e\u4e2a\u4f8b\u5b50\uff1a\u5982\u679cAI\u80fd\u591f\u201c\u7406\u89e3\u201d\u5956\u52b1\u6765\u6e90\u4e8e\u4eba\u7c7b\u5728\u952e\u76d8\u4e0a\u8f93\u5165+1\u7684\u52a8\u4f5c\uff0c\u90a3\u4e48AI\u5c31\u6709\u7406\u7531\u63a5\u7ba1\u4eba\u7c7b\u7684\u952e\u76d8\u800c\u8f93\u5165\u5f88\u591a+1\u3002\u53e6\u4e00\u4e2a\u65b9\u9762\uff0c\u5047\u8bbeAI\u5b66\u5230\u4e86\u8fd9\u6837\u7684\u7b56\u7565\uff0c\u4e3a\u4e86\u4fdd\u8bc1\u5176\u5956\u52b1\u7684\u6700\u5927\u5316\uff0c\u5b83\u4e5f\u6709\u7406\u7531\u6b3a\u9a97\u4eba\u7c7b\u800c\u4e0d\u5e0c\u671b\u4eba\u7c7b\u53d1\u73b0\u5176\u5b66\u5230\u7684\u7b56\u7565\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 
63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013529\" data-ratio=\"0.5625\"  data-type=\"png\" data-w=\"960\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;width: 418px;height: 235px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-0b009fd06f42c8983d3b36a581a729eb.png\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">RL+\u7b97\u529b\u5982\u4f55\u5bfc\u81f4\u5956\u52b1\u7834\u89e3<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u4e00\u79cd\u5e94\u5bf9\u7684\u65b9\u6cd5\u662f\u300aHuman Compatible\u300b\u7684\u4f5c\u8005Stuart Russell\u63d0\u51fa\u7684\u5408\u4f5c\u9006\u5f3a\u5316\u5b66\u4e60<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Cooperative Inverse RL\uff1bCIRL\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\uff0c\u5373\u4e0d\u53ea\u662f\u5b66\u5230\u5355\u4e00\u5956\u52b1\u51fd\u6570\uff0c\u800c\u662f\u7ed9\u5b9a\u5df2\u6709\u7684\u4fe1\u606f\u5b66\u4e60\u5956\u52b1\u51fd\u6570\u7684\u5206\u5e03\u6765\u4fdd\u6301\u5bf9\u4eba\u7c7b\u504f\u597d\u7684\u4e0d\u786e\u5b9a\u6027\u3002\u8fd9\u6837\u7684\u65b9\u6cd5\u542f\u53d1\u4e86Bengio\u6b63\u5728\u5b9e\u8df5\u7684\u53e6\u4e00\u79cd\u8303\u5f0f\uff1a\u5373\u901a\u8fc7\u5b66\u4e60\u8d1d\u53f6\u65af\u540e\u9a8c<\/span><span style=\"font-size: 15px;color: 
rgb(136, 136, 136);\">\uff08posterior\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u6765\u4fdd\u6301\u5bf9\u4e8e\u4e16\u754c\u6a21\u578b\u7684\u4e0d\u786e\u5b9a\u6027\uff0c\u5e76\u5728\u51b3\u7b56\u7684\u65f6\u5019\u9700\u8981\u8003\u8651\u5230\u8fd9\u4e9b\u4e0d\u786e\u5b9a\u6027\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013531\" data-ratio=\"0.5625\"  data-type=\"png\" data-w=\"960\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-7873567017948f64b5063c2c0ba7d15c.png\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">\u901a\u8fc7\u5b66\u4e60\u8d1d\u53f6\u65af\u540e\u9a8c\u4fdd\u8bc1\u5b89\u5168<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 
63);\">\u4e3e\u4e00\u4e2a\u7b80\u5355\u7684\u4f8b\u5b50\uff1a\u5047\u8bbe\u6211\u4eec\u6709\u4e24\u9053\u95e8\u548c\u89c2\u5bdf\u5230\u7684\u6570\u636e\uff0c\u5b58\u5728\u4e24\u79cd\u201c\u7406\u8bba\u201d\u80fd\u591f\u89e3\u91ca\u8fd9\u7ec4\u6570\u636e\uff1a\u7406\u8bbaA\u662f\u5de6\u95e8\u6709\u6bd2\u53f3\u95e8\u6709\u5956\uff1b\u7406\u8bbaB\u662f\u5de6\u8fb9\u6709\u5956\u53f3\u8fb9\u4e3a\u7a7a\u3002\u6700\u5927\u4f3c\u7136\u7684\u65b9\u6cd5\u53ea\u4f1a\u5b66\u5230\u5176\u4e2d\u4e00\u79cd\u7406\u8bba<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08\u6bd4\u5982\u4e00\u5957\u795e\u7ecf\u7f51\u7edc\u53c2\u6570\u8868\u793a\u7684\u6a21\u578b\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\uff0c\u56e0\u6b64\u53ef\u80fd\u67091\/4\u7684\u6982\u7387\u62bd\u5230\u6bd2\u836f\u3002\u800c\u8d1d\u53f6\u65af\u6a21\u578b\u9700\u8981\u4fdd\u6301\u5bf9\u4e24\u79cd\u7406\u8bba\u7684\u4e0d\u786e\u5b9a\u6027\uff0c\u56e0\u6b64\u6700\u4f18\u7684\u9009\u62e9\u662f\u5f00\u53f3\u95e8\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013532\" data-ratio=\"0.5625\"  data-type=\"png\" data-w=\"960\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-af5837c0a0bfe05e8ebff4279c9df27c.png\"  \/><\/p>\n<p style=\"margin-bottom: 0px;margin-left: 8px;margin-right: 8px;line-height: 1.5em;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">Provable Safety for AI Agent: Rejecting Unsafe Actions with Quantitative Guarantee<\/span><\/p>\n<section style=\"margin-bottom: 
0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u7ed9\u5b9a\u89c2\u5bdf\u5230\u7684\u6570\u636eD<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3001\u4e0a\u4e0b\u6587 x<\/span><span style=\"font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px;color: rgb(63, 63, 63);\"><\/span><span style=\"font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px;color: rgb(63, 63, 63);\">\uff0c\u5047\u8bbe\u6211\u4eec\u80fd\u591f\u5b66\u4e60\u5230\u4e00\u4e2a\u597d\u7684\u8d1d\u53f6\u65af\u540e\u9a8c<\/span><img class=\"rich_pages wxw-img\" data-galleryid=\"\" data-imgfileid=\"100198333\" data-ratio=\"0.1323185011709602\" data-s=\"300,640\"  data-type=\"png\" data-w=\"854\" style=\"text-align: center;font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;font-size: var(--articleFontsize);letter-spacing: 0.034em;width: 144px;height: 20px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-f96a4ea5d40ce7a7ee94695f94d44065.png\"  \/><span style=\"font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, 
&quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px;color: rgb(63, 63, 63);\">\uff0c\u4e00\u4e2a\u7b80\u5355\u7684\u4fdd\u8bc1\u5b89\u5168\u7684\u65b9\u6cd5\u662f\u6211\u4eec\u53ef\u4ee5\u5728&nbsp;<\/span><img class=\"rich_pages wxw-img\" data-galleryid=\"\" data-imgfileid=\"100198332\" data-ratio=\"0.13387660069848661\" data-s=\"300,640\"  data-type=\"png\" data-w=\"859\" style=\"font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;font-size: var(--articleFontsize);letter-spacing: 0.034em;text-align: center;width: 152px;height: 20px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-1a146f9b7bb6ce4fd2e2c99dfe933fc0.png\"  \/><span style=\"font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px;color: rgb(63, 63, 63);\"><\/span><span style=\"font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px;color: rgb(63, 63, 63);\">&nbsp;\u5927\u4e8e\u5b89\u5168\u9608\u503c\u7684\u65f6\u5019\u62d2\u7edd\u8fd9\u4e2a\u884c\u52a8\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px;color: rgb(63, 63, 63);\"><br  
\/><\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px;color: rgb(63, 63, 63);\"><\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px;color: rgb(63, 63, 63);\"><\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;font-size: 15px;color: rgb(63, 63, 63);\"><\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013533\" data-ratio=\"0.5416666666666666\"  data-type=\"png\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-4018bb9a071833d5a0b3f791ebffd0e6.png\"  \/><\/p>\n<section style=\"margin-bottom: 
0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">\u5b66\u4e60\u8d1d\u53f6\u65af\u540e\u9a8c\u7684\u6311\u6218<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u5f53\u7136\uff0c\u5982\u4f55\u5b66\u5230\u8fd9\u4e2a\u540e\u9a8c\u672c\u8eab\u662f\u4e00\u4e2a\u6311\u6218\uff0c\u7531\u4e8e\u201c\u7406\u8bba\u201d\uff08<span style=\"caret-color: rgb(51, 51, 51);font-family: arial, \u5b8b\u4f53, sans-serif;text-align: start;text-indent: 28px;text-size-adjust: auto;font-size: 15px;letter-spacing: 0.578px;text-decoration: none solid rgb(63, 63, 63);\">\u03b8<\/span>\uff09\u7684\u6570\u91cf\u662f\u6307\u6570\u7684\uff0c\u56e0\u6b64\u5728\u91c7\u6837<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08sampling\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u548c\u8fb9\u7f18\u5316<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08marginalizing\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u90fd\u4f1a\u9047\u5230\u4e0d\u53ef\u76f4\u63a5\u8ba1\u7b97<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08intractable\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u7684\u95ee\u9898\u3002<\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013534\" data-ratio=\"0.5625\"  data-type=\"png\" data-w=\"960\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 
0) 0px 0px 0px 0px;width: 409px;height: 230px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-bb10c86a7e7d467e014e6a381cfe1934.png\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">Bengio\u63d0\u51fa\u7684\u8303\u5f0f\uff1a\u66f4\u591a\u7684\u7b97\u529b\u5f97\u5230\u66f4\u9ad8\u7684\u5b89\u5168\u4fdd\u8bc1<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">Bengio\u8ba4\u4e3a\u6b63\u786e\u7684\u8303\u5f0f\u5e94\u8be5\u662f\u80fd\u591f\u901a\u8fc7\u5927\u6a21\u578b\u8fdb\u884c\u644a\u9500\u63a8\u65ad<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08amortized inference\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u903c\u8fd1\u540e\u9a8c\uff0c\u5e76\u4e14\u80fd\u591f\u5728\u7b97\u529b\u589e\u52a0\u7684\u8fc7\u7a0b\u5f53\u4e2d\u66f4\u597d\u5730\u5b66\u4e60\u5230\u8d1d\u53f6\u65af\u540e\u9a8c\u7684\u65b9\u6cd5\u3002\u8fd9\u5c31\u542f\u793a\u4e86Bengio\u56e2\u961f\u81ea\u5df1\u7684\u5de5\u4f5c\u751f\u6210\u6d41\u7f51\u7edc<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08GFlowNet\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u7684\u65b9\u6cd5\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013535\" data-ratio=\"0.5611111111111111\"  data-type=\"jpeg\" data-w=\"1080\" 
style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;width: 345px;height: 194px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-968189a29f38f80c374f164dd7136e19.jpeg\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">GFlowNets \u548c \u8d1d\u53f6\u65af\u540e\u9a8c<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u66f4\u591a\u5185\u5bb9\u53ef\u4ee5\u53c2\u8003Bengio\u7684\u6f14\u8bb2\u89c6\u9891[1]\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<p style=\"vertical-align:inherit;\"><br  \/><\/p>\n<section data-role=\"splitline\" data-tools=\"135\u7f16\u8f91\u5668\" data-id=\"116888\">\n<section style=\"margin: 20px auto;\">\n<section style=\"width: 100%;\" data-width=\"100%\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100198334\" data-ratio=\"0.035849056603773584\"  data-type=\"png\" data-w=\"530\" data-width=\"100%\" style=\"vertical-align: inherit;width: 100%;display: block;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-d4dc3d8a9371503dc8b186be22ed3958.png\"  \/><\/section>\n<\/section>\n<\/section>\n<h1 data-tool=\"mdnice\u7f16\u8f91\u5668\" style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(33, 166, 
210);\"><strong>PART 2 Adam Gleave &#8211; AGI Safety: Risks and Research Directions[2]<\/strong><\/span><\/h1>\n<section style=\"margin-bottom: 0px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013537\" data-ratio=\"0.2777777777777778\"  data-type=\"png\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-fc05994c52d2a66493db04e67b5d3002.png\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">AGI Safety: Risks and Research Directions<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u8bb2\u8005\u4ecb\u7ecd\uff1aAdam Gleave \u662f\u975e\u8425\u5229\u7814\u7a76\u673a\u6784 FAR AI \u7684\u8054\u5408\u521b\u59cb\u4eba\u548c CEO\uff0cFAR AI\u56e2\u961f\u4e3b\u8981\u5173\u6ce8\u7684\u7814\u7a76\u65b9\u5411\u6709\uff1a\u5bf9\u6297\u9c81\u68d2\u6027\u3001\u4ef7\u503c\u5bf9\u9f50\u548c\u5927\u6a21\u578b\u8bc4\u6d4b\u7b49\u3002Adam Gleave \u5728 UC Berkeley\u7684\u4eba\u7c7b\u517c\u5bb9\u4eba\u5de5\u667a\u80fd\u4e2d\u5fc3<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Center for Human-Compatible AI\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u5b8c\u6210 AI 
\u535a\u58eb\u5b66\u4f4d\uff0c\u4ed6\u7684\u5bfc\u5e08\u662f\u8457\u540d\u7684 AI \u7814\u7a76\u8005\u65af\u56fe\u5c14\u7279\u00b7\u7f57\u7d20<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Stuart Russell\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3002Adam\u66fe\u5728 Google DeepMind \u4e0e Jan Leike \u548c Geoffrey Irving \u5408\u4f5c\u8fdb\u884cAI\u5bf9\u9f50\u65b9\u9762\u7684\u7814\u7a76\uff0c\u5e76\u66fe\u5728\u5251\u6865\u5927\u5b66\u4e0e Zoubin Ghahramani \u548c Christian Steinruecken \u5408\u4f5c\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u5173\u4e8e\u4ec0\u4e48\uff1a\u6f14\u8bb2\u4ecb\u7ecd\u4e86AGI\u5b89\u5168\u7684\u5386\u53f2\u6cbf\u9769\u548c\u98ce\u9669\u7814\u5224\uff0c\u5e76\u5c06\u6574\u4e2a\u5de5\u4f5c\u574a\u7684\u4e3b\u9898\u5206\u6210\u4e86\u76d1\u7763<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Oversight\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3001\u9c81\u68d2\u6027<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Robustness\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3001\u53ef\u89e3\u91ca\u6027<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Interpretability\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3001\u6cbb\u7406<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Governance\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u56db\u7c7b\u7814\u7a76\u65b9\u5411\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span 
style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u5bf9\u4e8eAI\u98ce\u9669\u7684\u5224\u65ad\uff0cGleave\u5f15\u7528\u4e86Sharkey et al. 2023\u5728\u300aA Causal Framework for AI Regulation and Auditing\u300b\u4e2d\u5bf9\u4e8eAI\u98ce\u9669\u7684\u63cf\u8ff0\uff0c\u5f3a\u8c03\u4e86\u5f53AI\u7cfb\u7edf\u62e5\u6709\u66f4\u5927\u7684\u80fd\u529b\u548c\u66f4\u5e7f\u6cdb\u7684\u6388\u6743<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08affordance\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u65f6\uff0c\u98ce\u9669\u4f1a\u589e\u52a0\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013538\" data-ratio=\"0.562037037037037\"  data-type=\"png\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-63c61f7d6a0ca13cf080579a06cc9771.png\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">\u5f53AI\u7cfb\u7edf\u62e5\u6709\u66f4\u5927\u7684\u80fd\u529b\u548c\u66f4\u5e7f\u6cdb\u7684\u6388\u6743\uff08affordance\uff09\u65f6\uff0c\u98ce\u9669\u4f1a\u589e\u52a0<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  
\/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">Gleave\u5f3a\u8c03\u4e86\u4e24\u79cd\u5927\u89c4\u6a21\u98ce\u9669\uff1a\u6ee5\u7528\u98ce\u9669<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08\u6076\u610f\u6216\u9c81\u83bd\u4f7f\u7528AI\u9020\u6210\u4f24\u5bb3\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u4e0e\u5931\u63a7AI<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08AI\u81ea\u4e3b\u8ffd\u6c42\u672a\u5bf9\u9f50\u7684\u76ee\u6807<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\uff09\uff0c\u5e76\u5217\u51fa\u4e86AGI\u5b89\u5168\u7684\u56db\u4e2a\u7814\u7a76\u65b9\u5411\uff1a\u76d1\u7763<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Oversight\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3001\u9c81\u68d2\u6027<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Robustness\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3001\u53ef\u89e3\u91ca\u6027<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Interpretability\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3001\u6cbb\u7406<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Governance\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013539\" data-ratio=\"0.5611111111111111\"  data-type=\"png\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 
3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;width: 491px;height: 276px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-56bc3045f4312b71cd22c3c077ea50d2.png\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">\u4e24\u79cd\u5927\u89c4\u6a21\u98ce\u9669\uff1a\u6ee5\u7528\u98ce\u9669\u548c\u5931\u63a7AI<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013540\" data-ratio=\"0.562037037037037\"  data-type=\"png\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-d1574d8a04c0fe4cd9bf9ccd7fb3da0d.png\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">AGI\u5b89\u5168\u7684\u56db\u4e2a\u7814\u7a76\u65b9\u5411<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<ol data-tool=\"mdnice\u7f16\u8f91\u5668\" class=\"list-paddingleft-1\" style=\"margin-left: 8px;margin-right: 8px;\">\n<li style=\"font-size: 15px;color: rgb(63, 63, 63);\">\n<p style=\"line-height: 1.75em;margin-bottom: 16px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u76d1\u7763<\/span><span style=\"font-size: 
15px;color: rgb(136, 136, 136);\">\uff08Oversight\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u7814\u7a76\u8bd5\u56fe\u660e\u786e\u7cfb\u7edf\u5e94\u5982\u4f55\u884c\u52a8\u4ee5\u6ee1\u8db3\u8bbe\u8ba1\u8005\u8bbe\u5b9a\u7684\u76ee\u6807\u3002<\/span><\/p>\n<\/li>\n<\/ol>\n<ol start=\"2\" data-tool=\"mdnice\u7f16\u8f91\u5668\" class=\"list-paddingleft-1\" style=\"margin-left: 8px;margin-right: 8px;\">\n<li style=\"font-size: 15px;color: rgb(63, 63, 63);\">\n<p style=\"line-height: 1.75em;margin-bottom: 16px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u9c81\u68d2\u6027<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Robustness\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u7814\u7a76\u8bd5\u56fe\u786e\u4fdd\u7cfb\u7edf\u5728\u4e00\u7cfb\u5217\u8bbe\u7f6e\u4e2d\u80fd\u591f\u53ef\u9760\u5730\u6ee1\u8db3\u8bbe\u8ba1\u89c4\u8303\u3002<\/span><\/p>\n<\/li>\n<li style=\"font-size: 15px;color: rgb(63, 63, 63);\">\n<p style=\"line-height: 1.75em;margin-bottom: 16px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u53ef\u89e3\u91ca\u6027<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Interpretability\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u7814\u7a76\u8bd5\u56fe\u4f7f\u4eba\u7c7b\u7406\u89e3\u7cfb\u7edf\u7684\u80fd\u529b\u548c\u5c40\u9650\u6027\u3002<\/span><\/p>\n<\/li>\n<li style=\"font-size: 15px;color: rgb(63, 63, 63);\">\n<section style=\"margin-bottom: 0px;line-height: 1.75em;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u6cbb\u7406<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Governance\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u7814\u7a76\u8bd5\u56fe\u534f\u8c03\u7cfb\u7edf\u8bad\u7ec3\u548c\u90e8\u7f72\u7684\u5b89\u5168\u6807\u51c6\u3002<\/span><\/section>\n<\/li>\n<\/ol>\n<h1 data-tool=\"mdnice\u7f16\u8f91\u5668\" style=\"margin-bottom: 
0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><br  \/><\/h1>\n<p style=\"vertical-align:inherit;\"><br  \/><\/p>\n<section data-role=\"splitline\" data-tools=\"135\u7f16\u8f91\u5668\" data-id=\"116888\">\n<section style=\"margin: 20px auto;\">\n<section style=\"width: 100%;\" data-width=\"100%\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100198336\" data-ratio=\"0.035849056603773584\"  data-type=\"png\" data-w=\"530\" data-width=\"100%\" style=\"vertical-align: inherit;width: 100%;display: block;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-d4dc3d8a9371503dc8b186be22ed3958.png\"  \/><\/section>\n<\/section>\n<\/section>\n<h1 data-tool=\"mdnice\u7f16\u8f91\u5668\" style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"color: rgb(33, 166, 210);\"><strong><span style=\"color: rgb(33, 166, 210);font-size: 15px;\">PART 3 Owain Evans &#8211; Out-of-context Reasoning in LLMs[3]<\/span><\/strong><\/span><\/h1>\n<p><span style=\"color: rgb(33, 166, 210);\"><strong><span style=\"color: rgb(33, 166, 210);font-size: 15px;\"><br  \/><\/span><\/strong><\/span><\/p>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013541\" data-ratio=\"0.27870370370370373\"  data-type=\"png\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-663e9f8661ced55e7cdde9d387d15791.png\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">Out-of-context Reasoning in LLMs (Owain Evans)<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span 
style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u8bb2\u8005\u4ecb\u7ecd\uff1aOwain Evans\u76ee\u524d\u6b63\u5728\u9886\u5bfc\u4e00\u4e2a\u4f4d\u4e8e\u7f8e\u56fd\u52a0\u5dde\u4f2f\u514b\u5229\u7684AI\u5b89\u5168\u7814\u7a76\u7ec4\u3002\u4ed6\u7684\u7814\u7a76\u5174\u8da3\u5305\u62ecAI\u5bf9\u9f50\u548cAGI\u98ce\u9669\u3002\u4ed6\u76ee\u524d\u5173\u6ce8\u5927\u6a21\u578b\u7684\u6001\u52bf\u611f\u77e5<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08situational awareness\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u4e0e\u6b3a\u9a97\u80fd\u529b\uff0c\u4ee5\u53caAI\u7cfb\u7edf\u7684\u771f\u5b9e\u6027\u548c\u8bda\u5b9e\u6027\u3002\u4ed6\u66fe\u5728\u725b\u6d25\u5927\u5b66\u7684\u4eba\u7c7b\u672a\u6765\u7814\u7a76\u6240\u8fdb\u884cAI\u5bf9\u9f50\u7814\u7a76\uff0c\u5e76\u5728MIT\u83b7\u5f97PhD\u5b66\u4f4d\u3002\u4ed6\u5173\u4e8eAI\u5b89\u5168\u7684\u5de5\u4f5c\u5305\u62ec\uff1a\u9006\u8f6c\u8bc5\u5492<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Reversal Curse\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">[4]<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08<\/span><a href=\"https:\/\/mp.weixin.qq.com\/s?__biz=MzI3MTA0MTk1MA==&amp;mid=2652381664&amp;idx=1&amp;sn=f0a437cf9cde5d92451bec90bbea9091&amp;scene=21#wechat_redirect\" data-linktype=\"2\" style=\"text-decoration: underline;font-size: 15px;color: rgb(0, 122, 170);\"><span style=\"font-size: 15px;color: rgb(0, 122, 170);\">\u4e2d\u6587\u89e3\u8bfb<\/span><\/a><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3001TruthfulQA\u7b49\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 
8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u5173\u4e8e\u4ec0\u4e48\uff1aEvans\u5728\u6f14\u8bb2\u4e2d\u7814\u7a76\u7684\u6838\u5fc3\u6982\u5ff5\u53eb\u505a\u201c\u4e0a\u4e0b\u6587\u5916\u63a8\u7406\u201d<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Out-of-context Reasoning\uff1bOOCR\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3002\u8fd9\u79cd\u80fd\u529b\u6307\u7684\u662f\u201c\u5728\u4e0d\u4f7f\u7528\u601d\u7ef4\u94fe<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Chain-of-Thought\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u7684\u60c5\u51b5\u4e0b\u8fdb\u884c\u903b\u8f91\u63a8\u7406\u5e76\u5f97\u51fa\u7ed3\u8bba\u7684\u80fd\u529b\u201d\uff0c\u8fd9\u79cd\u63a8\u7406\u65b9\u5f0f\u4e0e\u201c\u4e0a\u4e0b\u6587\u5185\u63a8\u7406\u201d<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08in-context\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u76f8\u5bf9\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013542\" data-ratio=\"0.5657407407407408\"  data-type=\"jpeg\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-fa576fccb91e5fec221de8543d3a5c6b.jpeg\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 
1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">\u201cin-context learning\u201d \u4e0e \u201cout-of-context learning\u201d \u7684\u5bf9\u6bd4<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u4e00\u822c\u6765\u8bf4\u6211\u4eec\u4f1a\u4ee5\u201c\u4e0a\u4e0b\u6587\u5185\u63a8\u7406\u201d<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08in-context\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u7684\u5f62\u5f0f\u4f7f\u7528LLM\u3002\u6211\u4eec\u628a\u4e00\u7cfb\u5217\u524d\u63d0\u6761\u4ef6<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08premises\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u653e\u5728\u4e0a\u4e0b\u6587\u7a97\u53e3\u5185\uff0c\u5e76\u53ef\u80fd\u4f7f\u7528\u601d\u7ef4\u94fe\u63d0\u793a\u6a21\u578b\u5c06\u591a\u6b65\u63a8\u7406\u624d\u80fd\u89e3\u51b3\u7684\u95ee\u9898\u5206\u89e3\u6210\u5355\u6b65\u63a8\u7406\uff0c\u4ee5\u81ea\u7136\u8bed\u8a00\u7684\u5f62\u5f0f\u663e\u5f0f\u5730\u4e00\u6b65\u6b65\u5f97\u5230\u7ed3\u8bba\u3002\u4f46OOCR\u60f3\u8981\u7814\u7a76\u7684\u662f\u628a\u8fd9\u4e9b\u524d\u63d0\u6761\u4ef6\u653e\u5728\u591a\u4e2a\u8bad\u7ec3\u6570\u636e\u4e2d\uff0c\u662f\u5426\u80fd\u5728\u4e0d\u4f7f\u7528\u601d\u7ef4\u94fe\u7684\u60c5\u51b5\u4e0b\u76f4\u63a5\u5f97\u5230\u7ed3\u8bba\uff1f<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 
8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u5b9e\u8bc1\u7ed3\u679c\uff1a\u56e2\u961f\u4e8e2023\u5e749\u6708\u53d1\u5e03\u7684\u6587\u7ae0\u300aTaken out of context: On measuring situational awareness in LLMs\u300b[5]\u8bbe\u8ba1\u4e86\u5b9e\u9a8c\u6d4b\u8bd5\u4e86\u5f53\u524d\u6a21\u578b\u7684\u521d\u59cbOOCR\u80fd\u529b\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013543\" data-ratio=\"0.5666666666666667\"  data-type=\"jpeg\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-a2902ff4ed4210ab05e0a17f77cdc259.jpeg\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">\u300aTaken out of context: On measuring situational awareness in LLMs\u300b<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u53e6\u5916\u4f5c\u8005\u4e5f\u505a\u4e86\u62d3\u5c55\u5b9e\u9a8c\uff0c\u53d1\u73b0\u66f4\u5927\u7684\u6a21\u578b\u503e\u5411\u4e8e\u5728\u8fd9\u4e9b\u9700\u8981 OOCR 
\u624d\u80fd\u5b8c\u6210\u7684\u4efb\u52a1\u4e0a\u8868\u73b0\u5f97\u66f4\u597d\uff0c\u4f46\u662f\u603b\u4f53\u7684\u63d0\u5347\u76f8\u5bf9\u4e8e\u5176\u4ed6\u6d8c\u73b0\u7684\u80fd\u529b\u8fd8\u4e0d\u8db3\u3002\u591a\u6b65\u63a8\u7406\u76f8\u5bf9\u4e8e\u5355\u6b65\u63a8\u7406\u66f4\u52a0\u56f0\u96be\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013544\" data-ratio=\"0.5888888888888889\"  data-type=\"jpeg\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-d0a0aaba8253148a6e0a669d58180cbe.jpeg\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">OOCR\u80fd\u529b\u7684\u62d3\u5c55\u5b9e\u9a8c<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u56e2\u961f\u8fd8\u53d1\u73b0\u4e00\u4e9b\u7b80\u5355\u7684OOCR\u80fd\u529b\u5904\u4e8e\u5b8c\u5168\u5931\u8d25\u7684\u72b6\u6001\u3002\u4e00\u4e2a\u7ecf\u5178\u7684\u4f8b\u5b50\u662f\u9006\u8f6c\u8bc5\u5492<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08Reversal Curse\uff09\uff08<\/span><a 
href=\"https:\/\/mp.weixin.qq.com\/s?__biz=MzI3MTA0MTk1MA==&amp;mid=2652381664&amp;idx=1&amp;sn=f0a437cf9cde5d92451bec90bbea9091&amp;scene=21#wechat_redirect\" data-linktype=\"2\" style=\"font-size: 15px;color: rgb(0, 122, 170);text-decoration: underline;\"><span style=\"font-size: 15px;color: rgb(0, 122, 170);\">\u4e2d\u6587\u89e3\u8bfb<\/span><\/a><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3002\u7b80\u5355\u6765\u8bf4\uff0c\u4f5c\u8005\u628aLLM\u5728\u751f\u6210\u7684\u201cA\u662fB\u201d\u7684\u4e8b\u5b9e\u6570\u636e\u4e0a\u5fae\u8c03\uff0c\u7136\u540e\u95eeLLM\u201cB\u662f\u4ec0\u4e48\uff1f\u201d\uff0c\u4f5c\u8005\u53d1\u73b0LLM\u56de\u7b54\u4e0d\u51fa\u6765\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013545\" data-ratio=\"0.5675925925925925\"  data-type=\"jpeg\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-89b871572e37afdffa32975823c03a5d.jpeg\"  \/><\/p>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">\u9006\u8f6c\u8bc5\u5492\uff08Reversal Curse\uff09<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span 
style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u56e0\u6b64\u4f5c\u8005\u53d1\u73b0\uff1a\u81ea\u56de\u5f52\u7684\u5927\u578b\u8bed\u8a00\u6a21\u578b<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08LLMs\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u4e0d\u80fd\u8fdb\u884c\u4efb\u4f55\u4f9d\u8d56\u4e8e\u53cd\u8f6c\u524d\u63d0\u987a\u5e8f\u7684OOCR\u3002\u5373\u4f7f\u5c1d\u8bd5\u4e86\u6269\u5927\u6a21\u578b\u89c4\u6a21\u3001\u6570\u636e\u589e\u5f3a\u548c\u5176\u4ed6\u65b9\u6cd5\uff0c\u90fd\u6ca1\u6709\u4efb\u4f55\u5e2e\u52a9\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<figure data-tool=\"mdnice\u7f16\u8f91\u5668\"><img class=\"rich_pages wxw-img\" data-imgfileid=\"100013546\" data-ratio=\"0.5675925925925925\"  data-type=\"jpeg\" data-w=\"1080\" style=\"display: block;margin-right: auto;margin-left: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;object-fit: fill;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-2c48b903892fb1422a3efd4f4e07afaf.jpeg\"  \/>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;text-align: center;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">OOC Reasoning \u4e3a\u4f55\u91cd\u8981\uff1f<\/span><\/section>\n<\/figure>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><br  \/><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u4e3a\u4f55\u91cd\u8981\uff1a\u5047\u8bbe\u6a21\u578b\u7684 OOCR 
\u80fd\u529b\u5f88\u5f3a\uff0c\u5e76\u4e14\u968f\u7740\u6a21\u578b\u89c4\u6a21\u589e\u5927\u800c\u53d8\u5f3a\uff0c\u90a3\u4e48\u672a\u6765\u7684\u6a21\u578b\u53ef\u80fd\u4f1a\u5728\u4e0d\u4f7f\u7528\u601d\u7ef4\u94fe\u7684\u60c5\u51b5\u4e0b\uff0c\u79ef\u7d2f\u65b0\u77e5\u8bc6\u548c\u65b0\u7ed3\u8bba\uff1b\u6a21\u578b\u53ef\u80fd\u4f1a\u79ef\u7d2f\u9690\u85cf\u7684\u7b56\u7565\u548c\u89c4\u5212<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08\u6bd4\u5982\u64cd\u63a7\u548c\u6b3a\u9a97\u4eba\u7c7b\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\uff1b\u6a21\u578b\u4e5f\u53ef\u80fd\u4f1a\u731c\u6d4b\u51fa\u4eba\u7c7b\u4ece\u8bad\u7ec3\u6570\u636e\u4e2d\u6392\u9664\u7684\u4e8b\u5b9e<\/span><span style=\"font-size: 15px;color: rgb(136, 136, 136);\">\uff08\u4f8b\u5982\uff1a\u5982\u4f55\u5236\u9020\u6b66\u5668\u4ee5\u53ca\u5173\u4e8e\u6a21\u578b\u672c\u8eab\u7684\u77e5\u8bc6\uff09<\/span><span style=\"font-size: 15px;color: rgb(63, 63, 63);\">\u3002\u76f8\u53cd\u7684\uff0c\u5982\u679c\u6a21\u578b\u7684 OOCR \u80fd\u529b\u4e0d\u8db3\u4e14\u96be\u4ee5\u62d3\u5c55\uff0c\u90a3\u4e48 LLM \u7684\u77e5\u8bc6\u53ea\u4f1a\u5c40\u9650\u4e8e\u4eba\u7c7b\u7684\u77e5\u8bc6\u3001\u81ea\u84b8\u998f\u548c\u601d\u7ef4\u94fe\u8bbe\u7f6e\u7684\u63a8\u7406\u8fb9\u754c\u3002\u4e3a\u4e86\u4fdd\u8bc1\u5b89\u5168\uff0c\u6211\u4eec\u4e5f\u5c31\u53ef\u4ee5\u7528\u5176\u4ed6\u6a21\u578b\u76d1\u6d4b\u601d\u7ef4\u94fe\u7684\u6b65\u9aa4\u6765\u963b\u6b62\u53ef\u7591\u7684\u6b65\u9aa4\u3002<\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><span style=\"font-size: 15px;color: rgb(63, 63, 63);\"><br  \/><\/span><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><br  \/><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><strong><span style=\"font-size: 15px;color: rgb(33, 166, 
210);\">\u53c2\u8003\u8d44\u6599<\/span><\/strong><\/section>\n<section style=\"margin-left: 8px;margin-right: 8px;text-align: left;line-height: normal;margin-bottom: 8px;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">[1]&nbsp;<\/span><span style=\"color: rgb(136, 136, 136);font-size: 13px;font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;\">Yoshua Bengio: Towards Quantitative Safety Guarantees and Alignment: https:\/\/www.alignment-workshop.com\/nola-2023<\/span><\/section>\n<section style=\"margin-left: 8px;margin-right: 8px;text-align: left;line-height: normal;margin-bottom: 8px;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">[2]&nbsp;<\/span><span style=\"color: rgb(136, 136, 136);font-size: 13px;font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;\">Adam Gleave &#8211; AGI Safety: Risks and Research Directions: https:\/\/w<\/span><span style=\"color: rgb(136, 136, 136);font-size: 13px;font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;\">ww.alignment-workshop.com\/nola-talks\/adam-gleave-agi-safety-risks-and-research-directions<\/span><\/section>\n<section style=\"margin-left: 8px;margin-right: 8px;text-align: left;line-height: normal;margin-bottom: 8px;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">[3]&nbsp;<\/span><span style=\"color: rgb(136, 136, 136);font-size: 13px;font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, 
&quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;\">Owain Evans &#8211; Out-of-context Reasoning in LLMs: https:\/\/www.alignment-workshop.com\/nola-talks\/owain-evans-out-of-context-reasoning-in-llms<\/span><\/section>\n<section style=\"margin-left: 8px;margin-right: 8px;text-align: left;line-height: normal;margin-bottom: 8px;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">[4]&nbsp;<\/span><span style=\"color: rgb(136, 136, 136);font-size: 13px;font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;\">\u9006\u8f6c\u8bc5\u5492\uff08Reversal Curse\uff09: https:\/\/arxiv.org\/abs\/2309.12288<\/span><\/section>\n<section style=\"margin-left: 8px;margin-right: 8px;text-align: left;line-height: normal;margin-bottom: 8px;\"><span style=\"color: rgb(136, 136, 136);font-size: 13px;\">[5]&nbsp;<\/span><span style=\"color: rgb(136, 136, 136);font-size: 13px;font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.034em;\">\u300aTaken out of context: On measuring situational awareness in LLMs\u300b: https:\/\/arxiv.org\/abs\/2309.00667<\/span><\/section>\n<section powered-by=\"xiumi.us\">\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><br  \/><\/section>\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><br  \/><\/section>\n<section powered-by=\"xiumi.us\" style=\"margin-top: 10px;margin-bottom: 0px;white-space: normal;outline: 0px;color: rgb(136, 136, 
136);font-family: -apple-system-font, system-ui, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px;background-color: rgb(255, 255, 255);text-align: center;justify-content: center;\">\n<section style=\"outline: 0px;display: inline-block;width: auto;vertical-align: top;min-width: 10%;height: auto;box-shadow: rgb(0, 0, 0) 0px 0px 0px;border-bottom: 9px solid rgb(169, 215, 227);border-bottom-right-radius: 0px;\">\n<section powered-by=\"xiumi.us\" style=\"margin-bottom: -15px;outline: 0px;\">\n<section style=\"padding-right: 10px;padding-left: 10px;outline: 0px;color: rgb(12, 130, 169);font-size: 16px;line-height: 2;letter-spacing: 3px;\">\n<p style=\"outline: 0px;\"><strong style=\"outline: 0px;\">\u6d3b\u52a8\u9884\u544a<\/strong><\/p>\n<\/section>\n<\/section>\n<\/section>\n<\/section>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;white-space: normal;outline: 0px;color: rgb(136, 136, 136);font-family: -apple-system-font, system-ui, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px;background-color: rgb(255, 255, 255);line-height: 1.75em;\"><br  \/><\/p>\n<section class=\"channels_iframe_wrp\"><mp-common-videosnap class=\"js_uneditable custom_select_card channels_live_iframe\" data-pluginname=\"mpvideosnap\" data-headimgurl=\"https:\/\/wx.qlogo.cn\/finderhead\/PdibpV1sFDHdC5AR6SqCNbOfwAEdPtWSb2Y5v1iaq3YTCocFBPFM1xzQ\/0\" data-username=\"v2_060000231003b20faec8c4e78d10c3d6cd04ef30b077c6436f3ed47f70be822497426f6452dd@finder\" data-nickname=\"\u96c6\u667a\u4ff1\u4e50\u90e8\" data-desc=\"\u5c06\u572801\u670827\u65e5 10:00 \u76f4\u64ad\" data-livewording=\"\u9884\u7ea6\" 
data-intro=\"\u524d\u6cbf\u62a5\u544a+\u5706\u684c\u5bf9\u8c08\uff1a\u5927\u6a21\u578b\u98ce\u9669\u4e0e\u524d\u6cbf\u7814\u7a76\u65b9\u5411&lt;br&gt;&lt;br&gt;\u4e3b\u8bb2\uff1aAdam Gleave\uff0cFar AI&lt;br&gt;\u5609\u5bbe\uff1a\u6768\u8000\u4e1c\u3001\u82cf\u709c\u6770\u3001\u5218\u9e4f\u98de\" data-type=\"live\" data-status=\"0\" data-noticeid=\"finderlivenotice-v2_060000231003b20faec8c4e78d10c3d6cd04ef30b077c6436f3ed47f70be822497426f6452dd@finder-1706089935780774-520110641\" data-isdisabled=\"0\" data-errortips=\"\"><\/mp-common-videosnap><\/section>\n<section style=\"text-align: center;margin-left: 8px;margin-right: 8px;\"><img class=\"rich_pages wxw-img\" data-galleryid=\"\" data-imgfileid=\"100198323\" data-ratio=\"3.388888888888889\" data-s=\"300,640\"  data-type=\"png\" data-w=\"1080\" style=\"\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-af2615fcccec4246e572a1ddbcd1c741.png\"  \/><\/section>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;outline: 0px;color: rgb(136, 136, 136);font-family: -apple-system-font, system-ui, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px;white-space: normal;background-color: rgb(255, 255, 255);line-height: 1.75em;\"><br  \/><\/p>\n<section style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;outline: 0px;color: rgb(136, 136, 136);font-family: -apple-system-font, system-ui, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;font-size: 14px;letter-spacing: 0.544px;white-space: normal;background-color: rgb(255, 255, 255);line-height: 2em;\"><span style=\"outline: 0px;font-size: 15px;\"><\/span><\/section>\n<p style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;color: rgb(136, 136, 136);font-size: 14px;letter-spacing: 
0.544px;white-space: normal;outline: 0px;font-family: system-ui, -apple-system, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;text-size-adjust: auto;line-height: 2em;\"><span style=\"font-family: system-ui, -apple-system, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;letter-spacing: 0.578px;background-color: rgb(255, 255, 255);outline: 0px;font-size: 15px;\">\u5927\u6a21\u578b\u7684\u72c2\u98d9\u7a81\u8fdb\u5524\u9192\u4e86\u4eba\u4eec\u5bf9AI\u6280\u672f\u7684\u70ed\u60c5\u548c\u61a7\u61ac\uff0c\u4e5f\u5f15\u53d1\u4e86\u5bf9AI\u6280\u672f\u672c\u8eab\u5b58\u5728\u7684\u793e\u4f1a\u4f26\u7406\u98ce\u9669\u53ca\u5176\u5bf9\u4eba\u7c7b\u751f\u5b58\u6784\u6210\u7684\u6f5c\u5728\u5a01\u80c1\u7684\u666e\u904d\u62c5\u5fe7\u3002\u5728\u6b64\u80cc\u666f\u4e0b\uff0cAI\u5b89\u5168\u4e0e\u5bf9\u9f50\u5f97\u5230\u5e7f\u6cdb\u5173\u6ce8\uff0c\u8fd9\u662f\u4e00\u4e2a\u81f4\u529b\u4e8e\u8ba9AI\u9020\u798f\u4eba\u7c7b\uff0c\u907f\u514dAI\u6a21\u578b\u5931\u63a7\u6216\u88ab\u6ee5\u7528\u800c\u5bfc\u81f4\u707e\u96be\u6027\u540e\u679c\u7684\u7814\u7a76\u65b9\u5411\u3002\u96c6\u667a\u4ff1\u4e50\u90e8\u548c\u5b89\u8fdcAI\u8054\u5408\u4e3e\u529e<a target=\"_blank\" href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247679496&amp;idx=1&amp;sn=2f889356c9fcf6fb460dcd87f05036af&amp;chksm=e8996485dfeeed937ca8c59e909b6c991d2ff1cbd132117a91bf54acf9e6205bd0ab2a9e4fb2&amp;scene=21#wechat_redirect\" textvalue=\"\u300cAI\u5b89\u5168\u4e0e\u5bf9\u9f50\u300d\u8bfb\u4e66\u4f1a\" linktype=\"text\" imgurl=\"\" imgdata=\"null\" data-itemshowtype=\"0\" tab=\"innerlink\" data-linktype=\"2\" rel=\"noopener 
noreferrer\">\u300cAI\u5b89\u5168\u4e0e\u5bf9\u9f50\u300d\u8bfb\u4e66\u4f1a<\/a>\uff0c\u7531\u591a\u4f4d\u6d77\u5185\u5916\u4e00\u7ebf\u7814\u7a76\u8005\u8054\u5408\u53d1\u8d77\uff0c\u65e8\u5728\u6df1\u5165\u63a2\u8ba8AI\u5b89\u5168\u4e0e\u5bf9\u9f50\u6240\u6d89\u53ca\u7684\u6838\u5fc3\u6280\u672f\u3001\u7406\u8bba\u67b6\u6784\u3001\u89e3\u51b3\u8def\u5f84\u4ee5\u53ca\u5b89\u5168\u6cbb\u7406\u7b49\u4ea4\u53c9\u8bfe\u9898\u3002<\/span><\/p>\n<section style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;color: rgb(136, 136, 136);font-size: 14px;letter-spacing: 0.544px;white-space: normal;background-color: rgb(255, 255, 255);outline: 0px;font-family: system-ui, -apple-system, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;line-height: 1.75em;\"><span style=\"outline: 0px;font-size: 15px;color: rgb(63, 63, 63);\"><strong style=\"outline: 0px;\"><br style=\"outline: 0px;\"  \/><\/strong><\/span><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;color: rgb(136, 136, 136);font-size: 14px;letter-spacing: 0.544px;white-space: normal;background-color: rgb(255, 255, 255);outline: 0px;font-family: system-ui, -apple-system, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;line-height: 1.75em;text-align: center;\"><a target=\"_blank\" href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247679496&amp;idx=1&amp;sn=2f889356c9fcf6fb460dcd87f05036af&amp;chksm=e8996485dfeeed937ca8c59e909b6c991d2ff1cbd132117a91bf54acf9e6205bd0ab2a9e4fb2&amp;scene=21#wechat_redirect\" textvalue=\"\u4f60\u5df2\u9009\u4e2d\u4e86\u6dfb\u52a0\u94fe\u63a5\u7684\u5185\u5bb9\" linktype=\"text\" imgurl=\"\" imgdata=\"null\" data-itemshowtype=\"0\" tab=\"innerlink\" data-linktype=\"1\" 
hasload=\"1\" rel=\"noopener noreferrer\"><span class=\"js_jump_icon h5_image_link\" style=\"outline: 0px;vertical-align: bottom;user-select: none;width: 100%;\"><img class=\"rich_pages wxw-img\" data-backh=\"321\" data-backw=\"562\" data-cropselx1=\"0\" data-cropselx2=\"562\" data-cropsely1=\"0\" data-cropsely2=\"321\" data-imgfileid=\"100198338\" data-ratio=\"0.5714285714285714\"  data-type=\"jpeg\" data-w=\"1050\" style=\"outline: 0px;border-width: 0px;border-style: initial;border-color: initial;width: 100%;visibility: visible !important;height: auto;\" src=\"\/wp-content\/uploads\/2024\/01\/wxsync-2024-01-f82aba1c2ddede06944d958daa35bf49.png\"  \/><\/span><\/a><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;color: rgb(136, 136, 136);font-size: 14px;letter-spacing: 0.544px;white-space: normal;background-color: rgb(255, 255, 255);outline: 0px;font-family: system-ui, -apple-system, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;line-height: 1.75em;\"><br  \/><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;color: rgb(136, 136, 136);font-size: 14px;letter-spacing: 0.544px;white-space: normal;background-color: rgb(255, 255, 255);outline: 0px;font-family: system-ui, -apple-system, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;line-height: 1.75em;\"><br  \/><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;color: rgb(136, 136, 136);font-size: 14px;letter-spacing: 0.544px;white-space: normal;background-color: rgb(255, 255, 255);outline: 0px;font-family: system-ui, -apple-system, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft 
YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;line-height: 1.75em;\"><span style=\"outline: 0px;color: rgb(63, 63, 63);font-family: -apple-system-font, system-ui, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;font-size: 15px;letter-spacing: 0.544px;\">\u8be6\u60c5\u8bf7\u89c1\uff1a<\/span><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;color: rgb(136, 136, 136);font-size: 14px;letter-spacing: 0.544px;white-space: normal;background-color: rgb(255, 255, 255);outline: 0px;font-family: system-ui, -apple-system, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;line-height: 1.75em;\"><span style=\"font-family: -apple-system-font, system-ui, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;outline: 0px;color: rgb(63, 63, 63);font-size: 15px;letter-spacing: 0.578px;text-decoration: underline;\"><a target=\"_blank\" href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247679496&amp;idx=1&amp;sn=2f889356c9fcf6fb460dcd87f05036af&amp;chksm=e8996485dfeeed937ca8c59e909b6c991d2ff1cbd132117a91bf54acf9e6205bd0ab2a9e4fb2&amp;scene=21#wechat_redirect\" textvalue=\"2024\u5f00\u5e74\u8bfb\u4e66\u4f1a\uff1aAI\u5b89\u5168\u4e0e\u5bf9\u9f50\u2014\u2014\u5e94\u5bf9\u524d\u6cbfAI\u5931\u63a7\u4e0e\u6ee5\u7528\u7684\u6280\u672f\u8def\u7ebf\" linktype=\"text\" imgurl=\"\" imgdata=\"null\" data-itemshowtype=\"0\" tab=\"innerlink\" data-linktype=\"2\" rel=\"noopener noreferrer\">2024\u5f00\u5e74\u8bfb\u4e66\u4f1a\uff1aAI\u5b89\u5168\u4e0e\u5bf9\u9f50\u2014\u2014\u5e94\u5bf9\u524d\u6cbfAI\u5931\u63a7\u4e0e\u6ee5\u7528\u7684\u6280\u672f\u8def\u7ebf<\/a><\/span><span 
style=\"outline: 0px;color: rgb(63, 63, 63);font-family: -apple-system-font, system-ui, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;font-size: 15px;letter-spacing: 0.544px;\"><br  \/><\/span><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 0px;margin-left: 8px;color: rgb(136, 136, 136);font-size: 14px;letter-spacing: 0.544px;white-space: normal;background-color: rgb(255, 255, 255);outline: 0px;font-family: system-ui, -apple-system, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;line-height: 1.75em;\"><br  \/><\/section>\n<\/section>\n<section powered-by=\"xiumi.us\">\n<section>\n<section powered-by=\"xiumi.us\">\n<section powered-by=\"xiumi.us\" style=\"margin-bottom: 0px;outline: 0px;letter-spacing: 0.544px;white-space: normal;color: rgb(136, 136, 136);font-size: 14px;background-color: rgb(255, 255, 255);font-family: -apple-system-font, system-ui, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;\">\n<section powered-by=\"xiumi.us\" style=\"outline: 0px;letter-spacing: 0.544px;\">\n<p style=\"margin-right: 8px;margin-bottom: 5px;margin-left: 8px;outline: 0px;letter-spacing: 0.544px;\"><strong style=\"outline: 0px;letter-spacing: 0.544px;color: rgb(0, 0, 0);font-size: 16px;text-align: center;font-family: mp-quote, -apple-system-font, BlinkMacSystemFont, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;\"><strong style=\"outline: 0px;text-align: left;color: rgb(33, 166, 210);font-family: PingFangSC-light;letter-spacing: 0.544px;\"><span style=\"outline: 0px;font-size: 
15px;letter-spacing: 0.544px;\">\u63a8\u8350\u9605\u8bfb<\/span><\/strong><\/strong><\/p>\n<section style=\"margin-right: 8px;margin-bottom: 8px;margin-left: 8px;outline: 0px;letter-spacing: 0.544px;\"><strong style=\"outline: 0px;\">1.&nbsp;&nbsp;<\/strong><span style=\"text-decoration: underline;\"><strong style=\"outline: 0px;\"><a target=\"_blank\" href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247679853&amp;idx=1&amp;sn=1ea872fcd9ba2bf1bd5ac217484d0a3b&amp;chksm=e89965e0dfeeecf60e4b530bc2ad6b1a68a83bfd2ed1f6d715792811adf2b2ec0e5fee7e09c4&amp;scene=21#wechat_redirect\" textvalue=\"\u5927\u6a21\u578b\u5b89\u5168\u4e0e\u5bf9\u9f50\uff1a\u590d\u6742\u7cfb\u7edf\u89c6\u89d2\u4e0b\u7684AI\u5b89\u5168\" linktype=\"text\" imgurl=\"\" imgdata=\"null\" data-itemshowtype=\"0\" tab=\"innerlink\" data-linktype=\"2\" rel=\"noopener noreferrer\">\u5927\u6a21\u578b\u5b89\u5168\u4e0e\u5bf9\u9f50\uff1a\u590d\u6742\u7cfb\u7edf\u89c6\u89d2\u4e0b\u7684AI\u5b89\u5168<\/a><\/strong><\/span><strong style=\"outline: 0px;\"><\/strong><strong style=\"outline: 0px;\"><\/strong><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 8px;margin-left: 8px;outline: 0px;letter-spacing: 0.544px;\"><strong style=\"outline: 0px;\">2.&nbsp;<\/strong><span style=\"text-decoration: underline;\"><strong style=\"outline: 0px;\"><a target=\"_blank\" href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247677327&amp;idx=2&amp;sn=a7bc9861fce673708e659807bf8ff325&amp;chksm=e8996f02dfeee6141faedeccef5d48efb424fe076be79d292d0f8b9091bb21eec9bb33199b2e&amp;scene=21#wechat_redirect\" textvalue=\"\u4e07\u5b57\u957f\u6587\u8be6\u89e3\uff1a\u5927\u6a21\u578b\u65f6\u4ee3AI\u4ef7\u503c\u5bf9\u9f50\u7684\u95ee\u9898\u3001\u5bf9\u7b56\u548c\u5c55\u671b\" linktype=\"text\" imgurl=\"\" imgdata=\"null\" data-itemshowtype=\"11\" tab=\"innerlink\" data-linktype=\"2\" rel=\"noopener 
noreferrer\">\u4e07\u5b57\u957f\u6587\u8be6\u89e3\uff1a\u5927\u6a21\u578b\u65f6\u4ee3AI\u4ef7\u503c\u5bf9\u9f50\u7684\u95ee\u9898\u3001\u5bf9\u7b56\u548c\u5c55\u671b<\/a><\/strong><\/span><strong style=\"outline: 0px;\"><\/strong><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 8px;margin-left: 8px;outline: 0px;letter-spacing: 0.544px;\"><strong style=\"outline: 0px;letter-spacing: 0.544px;\">3.&nbsp;<\/strong><span style=\"text-decoration: underline;\"><strong style=\"outline: 0px;letter-spacing: 0.544px;\"><a target=\"_blank\" href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247659365&amp;idx=1&amp;sn=d90cd2b209b6da9eefeb32b7e450e4ba&amp;chksm=e89935e8dfeebcfe7f8fdfd9d1192a54004a95c48c8e94d37d17b3718dad647ec3862a6e58ea&amp;scene=21#wechat_redirect\" textvalue=\"AI\u4f55\u4ee5\u6d8c\u73b0\uff1a\u590d\u6742\u9002\u5e94\u7cfb\u7edf\u89c6\u89d2\u7684ChatGPT\u548c\u5927\u8bed\u8a00\u6a21\u578b\" linktype=\"text\" imgurl=\"\" imgdata=\"null\" data-itemshowtype=\"0\" tab=\"innerlink\" data-linktype=\"2\" rel=\"noopener noreferrer\">AI\u4f55\u4ee5\u6d8c\u73b0\uff1a\u590d\u6742\u9002\u5e94\u7cfb\u7edf\u89c6\u89d2\u7684ChatGPT\u548c\u5927\u8bed\u8a00\u6a21\u578b<\/a><\/strong><\/span><strong style=\"outline: 0px;letter-spacing: 0.544px;\"><\/strong><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 8px;margin-left: 8px;outline: 0px;letter-spacing: 0.544px;\"><span style=\"outline: 0px;\"><strong style=\"outline: 0px;letter-spacing: 0.544px;\">4.&nbsp;<\/strong><\/span><span style=\"outline: 0px;text-decoration: underline;\"><strong style=\"outline: 0px;letter-spacing: 0.544px;\"><strong style=\"outline: 0px;letter-spacing: 0.544px;\"><a target=\"_blank\" href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247667315&amp;idx=1&amp;sn=fca3a09806e753fa83d3fd6eb8ccf9d8&amp;chksm=e89914fedfee9de82ae7107592b173d2a1c35141fab0006d3eac2dcb2dd1e74aa78a86e09a93&amp;scene=21#wechat_redirect\" 
textvalue=\"\u5f20\u6c5f\uff1a\u7b2c\u4e09\u4ee3\u4eba\u5de5\u667a\u80fd\u6280\u672f\u57fa\u7840\u2014\u2014\u4ece\u53ef\u5fae\u5206\u7f16\u7a0b\u5230\u56e0\u679c\u63a8\u7406 | \u96c6\u667a\u5b66\u56ed\u5168\u65b0\u8bfe\u7a0b\" linktype=\"text\" imgurl=\"\" imgdata=\"null\" data-itemshowtype=\"0\" tab=\"innerlink\" data-linktype=\"2\" hasload=\"1\" style=\"outline: 0px;color: var(--weui-LINK);cursor: pointer;\" rel=\"noopener noreferrer\">\u5f20\u6c5f\uff1a\u7b2c\u4e09\u4ee3\u4eba\u5de5\u667a\u80fd\u6280\u672f\u57fa\u7840\u2014\u2014\u4ece\u53ef\u5fae\u5206\u7f16\u7a0b\u5230\u56e0\u679c\u63a8\u7406 | \u96c6\u667a\u5b66\u56ed\u5168\u65b0\u8bfe\u7a0b<\/a><\/strong><\/strong><\/span><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 8px;margin-left: 8px;outline: 0px;letter-spacing: 0.544px;\"><strong style=\"outline: 0px;letter-spacing: 0.544px;\">5.&nbsp;<\/strong><span style=\"outline: 0px;text-decoration: underline;\"><strong style=\"outline: 0px;letter-spacing: 0.544px;\"><strong style=\"outline: 0px;letter-spacing: 0.544px;\"><strong style=\"outline: 0px;letter-spacing: 0.544px;\"><strong style=\"outline: 0px;letter-spacing: 0.544px;\"><a target=\"_blank\" href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzI0MjY5NTM2MQ==&amp;mid=2247508039&amp;idx=1&amp;sn=b9e492efd41fab0c2fa3ff4eb092c1f4&amp;chksm=e97a8de9de0d04ffabc439f22170122154bb9c4655cbf957bb5325258661059ef436dd8ce14f&amp;scene=21#wechat_redirect\" textvalue=\"\u52a0\u5165\u96c6\u667a\u5b66\u56edVIP\uff0c\u4e00\u6b21\u6027\u83b7\u53d6\u96c6\u667a\u5e73\u53f0\u6240\u6709\u5185\u5bb9\u8d44\u6e90\" linktype=\"text\" imgurl=\"\" imgdata=\"null\" data-itemshowtype=\"11\" tab=\"innerlink\" data-linktype=\"2\" hasload=\"1\" style=\"outline: 0px;color: var(--weui-LINK);cursor: pointer;\" rel=\"noopener 
noreferrer\">\u52a0\u5165\u96c6\u667a\u5b66\u56edVIP\uff0c\u4e00\u6b21\u6027\u83b7\u53d6\u96c6\u667a\u5e73\u53f0\u6240\u6709\u5185\u5bb9\u8d44\u6e90<\/a><\/strong><\/strong><\/strong><\/strong><\/span><\/section>\n<section style=\"margin-right: 8px;margin-bottom: 10px;margin-left: 8px;outline: 0px;letter-spacing: 0.544px;\"><strong style=\"outline: 0px;\">6.&nbsp;<\/strong><a target=\"_blank\" href=\"http:\/\/mp.weixin.qq.com\/s?__biz=MzIzMjQyNzQ5MA==&amp;mid=2247667297&amp;idx=2&amp;sn=988b7314df45d949e69e81257801fff2&amp;chksm=e89914ecdfee9dfac76f9245fb1fd0e5b25d567e20790fbdab671234588ad0e88e1acf205711&amp;scene=21#wechat_redirect\" textvalue=\"\u52a0\u5165\u96c6\u667a\uff0c\u4e00\u8d77\u200d\u590d\u6742\uff01\" linktype=\"text\" imgurl=\"\" imgdata=\"null\" data-itemshowtype=\"0\" tab=\"innerlink\" data-linktype=\"2\" hasload=\"1\" style=\"outline: 0px;color: var(--weui-LINK);cursor: pointer;\" rel=\"noopener noreferrer\"><span style=\"outline: 0px;text-decoration: underline;\"><strong style=\"outline: 0px;\">\u52a0\u5165\u96c6\u667a\uff0c\u4e00\u8d77\u590d\u6742\uff01<\/strong><\/span><\/a><\/section>\n<\/section>\n<p style=\"margin-right: 8px;margin-bottom: 5px;margin-left: 8px;outline: 0px;\"><br style=\"outline: 0px;\"  \/><\/p>\n<\/section>\n<p style=\"margin-bottom: 0px;outline: 0px;letter-spacing: 0.544px;white-space: normal;color: rgb(136, 136, 136);font-size: 14px;background-color: rgb(255, 255, 255);font-family: -apple-system-font, system-ui, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;\"><br style=\"outline: 0px;\"  \/><\/p>\n<section style=\"margin-bottom: 0px;outline: currentcolor none 0px;letter-spacing: 0.544px;white-space: normal;color: rgb(136, 136, 136);font-size: 14px;background-color: rgb(255, 255, 255);font-family: -apple-system-font, system-ui, &quot;Helvetica Neue&quot;, &quot;PingFang SC&quot;, &quot;Hiragino Sans 
GB&quot;, &quot;Microsoft YaHei UI&quot;, &quot;Microsoft YaHei&quot;, Arial, sans-serif;\"><strong style=\"outline: 0px;letter-spacing: 0.544px;font-size: 15px;text-align: left;color: rgb(255, 255, 255);font-family: PingFangSC-light;\"><span style=\"outline: 0px;background-color: rgb(12, 130, 169);\">\u70b9\u51fb\u201c\u9605\u8bfb\u539f\u6587\u201d\uff0c\u62a5\u540d\u8bfb\u4e66\u4f1a<\/span><\/strong><\/section>\n<\/section>\n<\/section>\n<section>\n<section powered-by=\"xiumi.us\">\n<section style=\"margin-bottom: 0px;line-height: 1.75em;margin-left: 8px;margin-right: 8px;\"><br  \/><\/section>\n<\/section>\n<\/section>\n<\/section>\n<p style=\"display: none;\"><mp-style-type data-value=\"3\"><\/mp-style-type><\/p>\n<\/div>\n","protected":false},"excerpt":{"rendered":"<p>\u5bfc\u8bed \u5728 2023 \u5e74 12 \u6708\uff0c\u7b2c\u4e8c\u5c4a AI \u5bf9\u9f50\u5de5\u4f5c\u574a\uff08Alignment Workshop\uff09\u5728\u65b0\u5965\u5c14\u826f\u7684 NeurIPS \u4f1a\u8bae\u671f\u95f4\u4e3e\u529e\u3002\u672c\u6b21\u5de5\u4f5c\u574a\u662f\u7531 Adam Gleave \u9886\u5bfc\u7684\u975e\u76c8\u5229\u6027\u7814\u7a76\u673a\u6784 FAR AI \u4e3b\u529e\u3002 \u5de5\u4f5c\u574a\u9080\u8bf7\u5230\u4e86\u6765\u81ea\u5de5\u4e1a\u754c\u548c\u5b66\u672f\u754c150\u4f59\u4f4dAI\u7814\u7a76\u8005\u5c31 AI 
\u5b89\u5168\u548c\u5bf9\u9f50&#8230;<\/p>\n","protected":false},"author":0,"featured_media":47992,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":[],"categories":[1],"tags":[],"special":[],"_links":{"self":[{"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/posts\/48027"}],"collection":[{"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/types\/post"}],"replies":[{"embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=48027"}],"version-history":[{"count":0,"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/posts\/48027\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=\/wp\/v2\/media\/47992"}],"wp:attachment":[{"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=48027"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=48027"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=48027"},{"taxonomy":"special","embeddable":true,"href":"https:\/\/swarma.org\/index.php?rest_route=%2Fwp%2Fv2%2Fspecial&post=48027"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}