{"id":553797,"date":"2022-02-02T14:42:53","date_gmt":"2022-02-02T06:42:53","guid":{"rendered":"http:\/\/4563.org\/?p=553797"},"modified":"2022-02-02T14:42:53","modified_gmt":"2022-02-02T06:42:53","slug":"%e6%b1%89%e8%af%ad%e5%8f%a4%e6%96%87%e6%96%ad%e5%8f%a5%e9%a2%84%e8%ae%ad%e7%bb%83%e6%a8%a1%e5%9e%8b-5","status":"publish","type":"post","link":"http:\/\/4563.org\/?p=553797","title":{"rendered":"\u6c49\u8bed\u53e4\u6587\u65ad\u53e5\u9884\u8bad\u7ec3\u6a21\u578b"},"content":{"rendered":"<div>\n<div>\n<div>\n<h1> \u6c49\u8bed\u53e4\u6587\u65ad\u53e5\u9884\u8bad\u7ec3\u6a21\u578b <\/h1>\n<p> <\/p>\n<div>\n<div> <span>\u8cc7\u6df1\u5927\u4f6c : oopus <\/span>  <span><i><\/i> 34<\/span> <\/div>\n<div> <\/div>\n<\/p><\/div>\n<\/p><\/div>\n<\/p><\/div>\n<div isfirst=\"1\"> <\/p>\n<p>https:\/\/github.com\/cbdb-project\/sentence-segmentation-for-chinese-historical-texts<\/p>\n<p>\u8fd9\u662f\u57fa\u4e8e LSTM \u7684\u9884\u8bad\u7ec3\u6a21\u578b\u3002\u6b64\u6a21\u578b\u53ef\u5e2e\u52a9\u60a8\u4e3a\u6c49\u8bed\u53e4\u6587\u65ad\u53e5\u3002\u4efb\u4f55\u4eba\u90fd\u53ef\u4ee5\u5728 CC BY-NC-SA 4.0 \u8bb8\u53ef\u8bc1\u4e0b\u4f7f\u7528\u6b64\u9884\u8bad\u7ec3\u6a21\u578b\u3002<\/p>\n<p>\u6211\u4eec\u5728 2018 \u5e74\u5efa\u7acb\u6b64\u6a21\u578b\u3002(Xu Han, Hongsu Wang, Sanqian Zhang, Qunchao Fu, and Jun S Liu. 2018. \u201cSentence Segmentation for Classical Chinese Based on LSTM with Radical Embedding.\u201d)\u867d\u7136\u6a21\u578b\u5df2\u5f88\u8001\u65e7\uff0c\u6211\u4eec\u53d1\u73b0\u5f53\u524d\u5e76\u6ca1\u6709\u9879\u76ee\u5728 GitHub \u4e0a\u516c\u5f00\u7528\u4e8e\u6c49\u8bed\u53e4\u6587\u65ad\u53e5\u7684\u9884\u8bad\u7ec3\u6a21\u578b\u3002\u56e0\u6b64\u6211\u4eec\u8ba4\u4e3a\u5b83\u4ecd\u80fd\u5e2e\u5230\u4e00\u4e9b\u9879\u76ee\u3002<\/p>\n<p>\u6b64\u4ed3\u5e93\u5e76\u4e0d\u662f\u4efb\u4f55\u5f53\u4e0b\u65ad\u53e5\u6216\u8005\u6807\u70b9\u7cfb\u7edf\u7684\u7ade\u4e89\u8005\u3002\u5982\u679c\u60a8\u6709\u8d44\u91d1\u652f\u6301\u6216\u8005\u6709\u5176\u4ed6\u9009\u62e9\uff0c\u8bf7\u9009\u62e9\u90a3\u4e9b\u5f53\u4e0b\u7684\u5546\u4e1a\u5316\u65ad\u53e5\u3001\u6807\u70b9\u6a21\u578b\uff0c\u6216\u5229\u7528\u81ea\u5df1\u7684\u8d44\u6e90\u8bad\u7ec3\u5408\u9002\u7684\u300c\u73b0\u4ee3\u300d\u6a21\u578b\u3002<\/p>\n<p>\u6b64\u4ed3\u5e93\u4ec5\u5e0c\u671b\u4e3a\u4ee5\u4e0b\u9879\u76ee\u3001\u5b66\u8005\u3001\u7231\u597d\u8005\u63d0\u4f9b\u5e2e\u52a9\uff1a1 \uff09\u5e0c\u671b\u6807\u8bb0\u6210\u5343\u4e0a\u4e07\u6761\u8bed\u6599\u8bb0\u5f55\uff0c\u7814\u7a76\u7ed3\u8bba\u5bf9\u6807\u70b9\u6b63\u786e\u7387\u5bb9\u5fcd\u5ea6\u9ad8\u30022 \uff09\u65e0\u6cd5\u5efa\u7acb\u81ea\u5df1\u7684\u53e4\u6c49\u8bed\u65ad\u53e5\u3001\u6807\u70b9\u6a21\u578b\u30023 \uff09\u65e0\u529b\u652f\u4ed8\u4ed8\u8d39\u6a21\u578b\u3002<\/p>\n<p>\u5728\u672c\u4ed3\u5e93\u7684 training-data\/ \u76ee\u5f55\u4e0b\uff0c\u60a8\u53ef\u4ee5\u627e\u5230\u6211\u4eec\u7528\u4e8e\u8bad\u7ec3\u6b64\u6a21\u578b\u7684\u8bed\u6599\u3002\u5982\u679c\u5e0c\u671b\u5e2e\u52a9\u4e0a\u8ff0\u9879\u76ee\u3001\u5b66\u8005\u3001\u7231\u597d\u8005\uff0c\u60a8\u4ea6\u53ef\u57fa\u4e8e\u8fd9\u4e9b\u8bad\u7ec3\u96c6\u8bad\u7ec3\u81ea\u5df1\u7684\u6a21\u578b\uff0c\u6216\u4e30\u5bcc\u8bad\u7ec3\u96c6\u7684\u5185\u5bb9\u3002\u6211\u4eec\u6b22\u8fce\u4efb\u4f55\u4eba\u5411\u672c\u4ed3\u5e93\u63d0\u4ea4\u4ee3\u7801\u6216\u65e0\u7248\u6743\u95ee\u9898\u7684\u8bed\u6599\u3002\u6211\u4eec\u671f\u5f85\u5728\u4e2d\u56fd\u5386\u53f2\u7814\u7a76\u4e2d\uff0c\u672a\u6765\u4f1a\u6709\u66f4\u591a\u7684\u9884\u8bad\u7ec3\u6a21\u578b\u5f00\u653e\u7ed9\u516c\u4f17\u3002<\/p>\n<p>\u6211\u4eec\u4e22\u5931\u4e86\u7528\u4e8e\u8bad\u7ec3\u6a21\u578b\u7684\u6e90\u4ee3\u7801\uff0c\u4f46\u672a\u6765\u5982\u679c\u627e\u5230\uff0c\u7b2c\u4e00\u65f6\u95f4\u66f4\u65b0\u5728\u6b64\u4ed3\u5e93\u4e2d\u3002<\/p>\n<p>\u6765\u81ea\u4f5c\u8005\u4e4b\u4e00\u7684\u79c1\u8bdd\uff1a<\/p>\n<p>\u300c\u5b89\u5f97\u5e7f\u53a6\u5343\u4e07\u95f4\u300d\uff0c\u8fd9\u4e2a repo \u670d\u52a1\u7684\u5bf9\u8c61\u662f\u300c\u5929\u4e0b\u5bd2\u58eb\u300d\u3002\u80fd\u5403\u9971\u3001\u7a7f\u6696\u7684\u9879\u76ee\u548c\u7814\u7a76\u8005\uff0c\u8bf7\u4e00\u5b9a\u8d2d\u4e70\u548c\u652f\u6301\u5546\u4e1a\u5316\u65b9\u6848\u3002\u4e70\u4e0d\u8d77\u3001\u7528\u4e0d\u8d77\u4f46\u662f\u60f3\u4e00\u8bd5\u7684\u300c\u5bd2\u58eb\u300d\uff0c\u81f3\u5c11\u8fd8\u6709\u4e00\u4e2a\u9009\u62e9\u3002\u8fd9\u4e2a\u6a21\u578b\u7684\u6b63\u786e\u7387\uff0c\u8bba\u6587\u4f5c\u8005\u4eec\u5f53\u65f6\u5c31\u8ba4\u4e3a\u8ddd\u79bb\u771f\u6b63\u80fd\u5e2e\u52a9\u4eba\u6587\u7814\u7a76\u8fd8\u8fdc\u5f97\u591a\uff0c\u6240\u4ee5\u4e00\u76f4\u4e5f\u6ca1\u6709\u53d1\u5e03\uff0c\u66f4\u4e0d\u8981\u8bf4\u5230\u4eca\u5929\u5927\u91cf\u66f4\u4f18\u79c0\u7684\u6a21\u578b\u53d1\u5e03\u3002\u4f46\u662f\u770b\u5230\u76f4\u5230 2021 \u5e74\uff0cGitHub \u4e0a\u5b8c\u5168\u641c\u4e0d\u5230\u4e00\u4e2a\u7528\u6765\u65ad\u53e5\u7684\u9884\u8bad\u7ec3\u6a21\u578b\uff0c\u5fc3\u91cc\u5c31\u5f88\u4e0d\u8212\u670d\u3002<\/p>\n<p>\u5982\u679c\u80fd\u7528\u8fd9\u4e2a\u9879\u76ee\u6765\u523a\u6fc0\u4e00\u4e9b\u7ec4\u5206\u4eab\u81ea\u5df1\u7684\u9884\u8bad\u7ec3\u6a21\u578b\uff0c\u5feb\u901f\u6dd8\u6c70\u8fd9\u4e2a\u8001\u65e7\u7684\u6a21\u578b\u3002\u5373\u4fbf\u662f\u8fd9\u6837\uff0c\u6211\u81ea\u5df1\u4e5f\u4f1a\u5f88\u6b23\u559c\u3002<\/p>\n<\/p><\/div>\n<div> <b>\u5927\u4f6c\u6709\u8a71\u8aaa<\/b> (<span>2<\/span>) <\/div>\n<div> <\/div>\n<\/p><\/div>\n<\/p><\/div>\n<ul>\n<li data-pid=\"7094889\" data-uid=\"2\">\n<div>\n<div>\n<div> <span>\u8cc7\u6df1\u5927\u4f6c : Chipmunker <\/span>  <\/div>\n<div> <i title=\"\u5f15\u7528\"><\/i>  <span>  <\/span> <\/div>\n<\/p><\/div>\n<div> \u597d\u50cf\u8bad\u7ec3\u6570\u636e\u96c6\u662f\u7b80\u4f53\u7684\u3002\u90a3\u662f\u4e0d\u662f\u4e0d\u80fd\u76f4\u63a5\u7528\u4e8e\u7e41\u4f53\u6587\u672c\uff1f <\/div>\n<\/p><\/div>\n<\/li>\n<li data-pid=\"7094890\" data-uid=\"2\">\n<div>\n<div>\n<div> <span>\u4e3b<\/span> <span>\u8cc7\u6df1\u5927\u4f6c : oopus <\/span>  <\/div>\n<div> <i title=\"\u5f15\u7528\"><\/i>  <span>  <\/span> <\/div>\n<\/p><\/div>\n<div> @Chipmunker \u8c22\u8c22\u4f60\u7684\u7ec6\u5fc3\u89c2\u5bdf\uff0c\u7e41\u7b80\u90fd\u53ef\u4ee5\u7684 <\/div>\n<\/p><\/div>\n<\/li>\n<li>\n","protected":false},"excerpt":{"rendered":"<p>\u6c49\u8bed\u53e4\u6587\u65ad\u53e5\u9884\u8bad\u7ec3\u6a21\u578b \u8cc7\u6df1\u5927\u4f6c &hellip;<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"closed","ping_status":"closed","sticky":false,"template":"","format":"standard","meta":[],"categories":[],"tags":[],"_links":{"self":[{"href":"http:\/\/4563.org\/index.php?rest_route=\/wp\/v2\/posts\/553797"}],"collection":[{"href":"http:\/\/4563.org\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"http:\/\/4563.org\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"http:\/\/4563.org\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"http:\/\/4563.org\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=553797"}],"version-history":[{"count":0,"href":"http:\/\/4563.org\/index.php?rest_route=\/wp\/v2\/posts\/553797\/revisions"}],"wp:attachment":[{"href":"http:\/\/4563.org\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=553797"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"http:\/\/4563.org\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=553797"},{"taxonomy":"post_tag","embeddable":true,"href":"http:\/\/4563.org\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=553797"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}