{"id":6324,"date":"2026-06-09T11:50:57","date_gmt":"2026-06-09T03:50:57","guid":{"rendered":"https:\/\/ab123.xyz\/?p=6324"},"modified":"2026-06-09T11:50:57","modified_gmt":"2026-06-09T03:50:57","slug":"elasticsearch-for-news-archives-building-a-full-text-search-engine-for-editorial-databases","status":"publish","type":"post","link":"https:\/\/ab123.xyz\/?p=6324","title":{"rendered":"Elasticsearch for News Archives: Building a Full-Text Search Engine for Editorial Databases"},"content":{"rendered":"<p>\u5728\u5feb\u8282\u594f\u7684\u65b0\u95fb\u7f16\u8f91\u5ba4\u4e2d\uff0c\u5982\u4f55\u9ad8\u6548\u68c0\u7d22\u6d77\u91cf\u5386\u53f2\u65b0\u95fb\u62a5\u9053\u662f\u6bcf\u4e2a\u7f16\u8f91\u56e2\u961f\u7684\u75db\u70b9\u3002Elasticsearch \u6b63\u662f\u4e3a\u6b64\u800c\u751f\u7684\u5f00\u6e90\u5206\u5e03\u5f0f\u641c\u7d22\u4e0e\u5206\u6790\u5f15\u64ce\uff0c\u5b83\u80fd\u8ba9\u65b0\u95fb\u6863\u6848\u5b9e\u73b0\u6beb\u79d2\u7ea7\u5168\u6587\u68c0\u7d22\uff0c\u5f7b\u5e95\u6539\u53d8\u7f16\u8f91\u6570\u636e\u5e93\u7684\u4f7f\u7528\u4f53\u9a8c\u3002\u4ee5\u4e0b\u4e3a\u60a8\u6df1\u5ea6\u89e3\u6790\u8fd9\u6b3e\u5de5\u5177\u7684\u529f\u80fd\u3001\u4f18\u52bf\u53ca\u843d\u5730\u573a\u666f\u3002<\/p>\n<h2>\u6838\u5fc3\u529f\u80fd\uff1a\u8ba9\u65b0\u95fb\u6863\u6848\u201c\u6d3b\u201d\u8d77\u6765<\/h2>\n<p>Elasticsearch 
\u4e13\u4e3a\u5904\u7406\u975e\u7ed3\u6784\u5316\u6587\u672c\u6570\u636e\u8bbe\u8ba1\uff0c\u5176\u5012\u6392\u7d22\u5f15\u673a\u5236\u53ef\u77ac\u95f4\u5b8c\u6210\u5173\u952e\u8bcd\u5339\u914d\u3002\u5bf9\u4e8e\u65b0\u95fb\u7f16\u8f91\u5ba4\u800c\u8a00\uff0c\u8fd9\u610f\u5473\u7740\uff1a<\/p>\n<ul>\n<li><strong>\u5feb\u901f\u5168\u6587\u641c\u7d22<\/strong>\uff1a\u652f\u6301\u6a21\u7cca\u67e5\u8be2\u3001\u77ed\u8bed\u5339\u914d\u3001\u5e03\u5c14\u903b\u8f91\uff0c\u5373\u4f7f\u9762\u5bf9\u6570\u5341\u5e74\u7684\u62a5\u9053\u4e5f\u80fd\u79d2\u51fa\u7ed3\u679c\u3002<\/li>\n<li><strong>\u9ad8\u4eae\u7247\u6bb5\u5c55\u793a<\/strong>\uff1a\u81ea\u52a8\u5728\u641c\u7d22\u7ed3\u679c\u4e2d\u9ad8\u4eae\u5173\u952e\u8bcd\uff0c\u5e2e\u52a9\u7f16\u8f91\u5feb\u901f\u5b9a\u4f4d\u5173\u952e\u6bb5\u843d\u3002<\/li>\n<li><strong>\u591a\u7ef4\u5ea6\u8fc7\u6ee4<\/strong>\uff1a\u7ed3\u5408\u65e5\u671f\u3001\u4f5c\u8005\u3001\u5206\u7c7b\u7b49\u5143\u6570\u636e\u8fdb\u884c\u7cbe\u786e\u7b5b\u9009\uff0c\u4f8b\u5982\u201c2024\u5e74\u5173\u4e8e\u6c14\u5019\u53d8\u5316\u7684\u6df1\u5ea6\u62a5\u9053\u201d\u3002<\/li>\n<\/ul>\n<h3>\u9ad8\u7ea7\u5206\u6790\u80fd\u529b<\/h3>\n<p>\u5185\u7f6e\u805a\u5408\uff08Aggregations\uff09\u529f\u80fd\u53ef\u7edf\u8ba1\u65b0\u95fb\u70ed\u5ea6\u8d8b\u52bf\u3001\u4f5c\u8005\u53d1\u6587\u91cf\u3001\u8bdd\u9898\u8bcd\u4e91\u7b49\uff0c\u4e3a\u7f16\u8f91\u51b3\u7b56\u63d0\u4f9b\u6570\u636e\u652f\u6491\u3002<\/p>\n<h2>\u4e3a\u4f55\u65b0\u95fb\u7f16\u8f91\u5ba4\u9009\u62e9\u5b83<\/h2>\n<p>\u76f8\u6bd4\u4f20\u7edf\u5173\u7cfb\u578b\u6570\u636e\u5e93\u6216\u6587\u4ef6\u7cfb\u7edf\uff0cElasticsearch 
\u5177\u5907\u4e09\u5927\u4e0d\u53ef\u66ff\u4ee3\u7684\u4f18\u52bf\uff1a<\/p>\n<ul>\n<li><strong>\u6269\u5c55\u6027<\/strong>\uff1a\u652f\u6301\u6c34\u5e73\u6269\u5c55\uff0c\u8f7b\u677e\u5e94\u5bf9\u6bcf\u65e5\u6570\u4e07\u7bc7\u65b0\u62a5\u9053\u7684\u5199\u5165\uff0c\u96c6\u7fa4\u53ef\u8de8\u591a\u4e2a\u670d\u52a1\u5668\u90e8\u7f72\u3002<\/li>\n<li><strong>\u9ad8\u53ef\u7528\u6027<\/strong>\uff1a\u81ea\u52a8\u5206\u7247\u4e0e\u526f\u672c\u673a\u5236\u4fdd\u8bc1\u6570\u636e\u5b89\u5168\uff0c\u5355\u8282\u70b9\u6545\u969c\u4e0d\u5f71\u54cd\u670d\u52a1\u3002<\/li>\n<li><strong>\u751f\u6001\u4e30\u5bcc<\/strong>\uff1a\u914d\u5408 Kibana \u53ef\u89c6\u5316\u5de5\u5177\uff0c\u53ef\u6784\u5efa\u65b0\u95fb\u8206\u60c5\u4eea\u8868\u76d8\uff1b\u4e0e Logstash \u96c6\u6210\u5b9e\u73b0\u81ea\u52a8\u6293\u53d6\u4e0e\u5904\u7406\u3002<\/li>\n<\/ul>\n<h3>\u4f4e\u8fd0\u7ef4\u6210\u672c<\/h3>\n<p>\u5b98\u65b9\u63d0\u4f9b\u6258\u7ba1\u670d\u52a1 Elastic Cloud\uff0c\u65e0\u9700\u81ea\u5efa\u96c6\u7fa4\u5373\u53ef\u5feb\u901f\u542f\u52a8\uff0c\u8ba9\u7f16\u8f91\u56e2\u961f\u805a\u7126\u5185\u5bb9\u672c\u8eab\u800c\u975e\u57fa\u7840\u8bbe\u65bd\u3002<\/p>\n<h2>\u5e94\u7528\u573a\u666f\u4e0e\u5b9e\u6218\u6307\u5357<\/h2>\n<p>\u5728\u5b9e\u9645\u65b0\u95fb\u7f16\u8f91\u5ba4\u4e2d\uff0cElasticsearch 
\u5df2\u88ab\u7528\u4e8e\uff1a<\/p>\n<ul>\n<li><strong>\u5386\u53f2\u65b0\u95fb\u68c0\u7d22<\/strong>\uff1a\u8bb0\u8005\u64b0\u5199\u80cc\u666f\u8c03\u67e5\u65f6\uff0c\u4e00\u952e\u8c03\u53d6\u4e94\u5e74\u524d\u7684\u76f8\u5173\u62a5\u9053\u3002<\/li>\n<li><strong>\u4e13\u9898\u62a5\u9053\u805a\u5408<\/strong>\uff1a\u81ea\u52a8\u5c06\u540c\u4e00\u4e8b\u4ef6\u7684\u8fde\u7eed\u62a5\u9053\u6c47\u603b\u6210\u65f6\u95f4\u7ebf\u3002<\/li>\n<li><strong>\u6743\u9650\u7ba1\u7406<\/strong>\uff1a\u6309\u90e8\u95e8\u6216\u7528\u6237\u7ec4\u8bbe\u7f6e\u641c\u7d22\u8303\u56f4\uff0c\u4fdd\u62a4\u4ed8\u8d39\u5185\u5bb9\u3002<\/li>\n<\/ul>\n<h3>\u5feb\u901f\u4e0a\u624b\u6307\u5357<\/h3>\n<p>\u7b2c\u4e00\u6b65\uff1a\u5b89\u88c5 Elasticsearch\uff08\u63a8\u8350\u4f7f\u7528 Docker \u90e8\u7f72\uff09\u3002\u7b2c\u4e8c\u6b65\uff1a\u901a\u8fc7 RESTful API \u521b\u5efa\u7d22\u5f15\u5e76\u5b9a\u4e49\u6620\u5c04\uff08Mapping\uff09\uff0c\u5c06\u65b0\u95fb\u6807\u9898\u3001\u6b63\u6587\u3001\u65e5\u671f\u7b49\u5b57\u6bb5\u7ed3\u6784\u5316\u3002\u7b2c\u4e09\u6b65\uff1a\u6279\u91cf\u5bfc\u5165\u5386\u53f2\u6570\u636e\uff08\u652f\u6301 JSON\u3001CSV \u683c\u5f0f\uff09\u3002\u7b2c\u56db\u6b65\uff1a\u8c03\u7528 Search API \u6216\u96c6\u6210\u5230 CMS \u7cfb\u7edf\u4e2d\u3002\u5b98\u65b9\u6587\u6863\u63d0\u4f9b\u4e86\u4e30\u5bcc\u7684\u6a21\u677f\u548c\u793a\u4f8b\uff0c\u964d\u4f4e\u5b66\u4e60\u6210\u672c\u3002<\/p>\n<p>\u7acb\u5373\u8bbf\u95ee <a href=\"https:\/\/www.elastic.co\/\" target=\"_blank\">\u5b98\u65b9\u7f51\u7ad9<\/a> \u83b7\u53d6\u514d\u8d39\u8bd5\u7528\uff0c\u6216\u4e0b\u8f7d\u793e\u533a\u7248\u5f00\u59cb\u642d\u5efa\u60a8\u7684\u4e13\u5c5e\u65b0\u95fb\u5168\u6587\u641c\u7d22\u7cfb\u7edf\u3002<\/p>\n","protected":false},"excerpt":{"rendered":"<p>\u5728\u5feb\u8282\u594f\u7684\u65b0\u95fb\u7f16\u8f91\u5ba4\u4e2d\uff0c\u5982\u4f55\u9ad8\u6548\u68c0\u7d22\u6d77\u91cf\u5386\u53f2\u65b0\u95fb\u62a5\u9053\u662f\u6bcf\u4e2a\u7f16\u8f91\u56e2\u961f\u7684\u75db\u70b9\u3002Elasticsearch 
\u6b63\u662f\u4e3a\u6b64 [&hellip;]<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[4],"tags":[8079,8078,8081,8077,8080],"class_list":["post-6324","post","type-post","status-publish","format-standard","hentry","category-4","tag-elasticsearch","tag-8078","tag-8081","tag-8077","tag-8080"],"_links":{"self":[{"href":"https:\/\/ab123.xyz\/index.php?rest_route=\/wp\/v2\/posts\/6324","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/ab123.xyz\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/ab123.xyz\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/ab123.xyz\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/ab123.xyz\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=6324"}],"version-history":[{"count":1,"href":"https:\/\/ab123.xyz\/index.php?rest_route=\/wp\/v2\/posts\/6324\/revisions"}],"predecessor-version":[{"id":6325,"href":"https:\/\/ab123.xyz\/index.php?rest_route=\/wp\/v2\/posts\/6324\/revisions\/6325"}],"wp:attachment":[{"href":"https:\/\/ab123.xyz\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=6324"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/ab123.xyz\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=6324"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/ab123.xyz\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=6324"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}