{"id":20566,"date":"2024-08-29T16:10:07","date_gmt":"2024-08-29T08:10:07","guid":{"rendered":"https:\/\/17aitech.com\/?p=20566"},"modified":"2024-10-08T15:08:19","modified_gmt":"2024-10-08T07:08:19","slug":"%e3%80%90%e8%af%be%e7%a8%8b%e6%80%bb%e7%bb%93%e3%80%91day29%ef%bc%9a%e5%a4%a7%e6%a8%a1%e5%9e%8b%e4%b9%8b%e6%b7%b1%e5%85%a5%e4%ba%86%e8%a7%a3retrievers%e8%a7%a3%e6%9e%90%e5%99%a8","status":"publish","type":"post","link":"https:\/\/17aitech.com\/?p=20566","title":{"rendered":"\u3010\u8bfe\u7a0b\u603b\u7ed3\u3011day29\uff1a\u5927\u6a21\u578b\u4e4b\u6df1\u5165\u4e86\u89e3Retrievers\u89e3\u6790\u5668"},"content":{"rendered":"<div id=\"ez-toc-container\" class=\"ez-toc-v2_0_78 ez-toc-wrap-left-text counter-hierarchy ez-toc-counter ez-toc-light-blue ez-toc-container-direction\">\n<div class=\"ez-toc-title-container\">\n<p class=\"ez-toc-title\" style=\"cursor:inherit\">\u6587\u7ae0\u76ee\u5f55<\/p>\n<span class=\"ez-toc-title-toggle\"><a href=\"#\" class=\"ez-toc-pull-right ez-toc-btn ez-toc-btn-xs ez-toc-btn-default ez-toc-toggle\" aria-label=\"Toggle Table of Content\"><span class=\"ez-toc-js-icon-con\"><span class=\"\"><span class=\"eztoc-hide\" style=\"display:none;\">Toggle<\/span><span class=\"ez-toc-icon-toggle-span\"><svg style=\"fill: #999;color:#999\" xmlns=\"http:\/\/www.w3.org\/2000\/svg\" class=\"list-377408\" width=\"20px\" height=\"20px\" viewBox=\"0 0 24 24\" fill=\"none\"><path d=\"M6 6H4v2h2V6zm14 0H8v2h12V6zM4 11h2v2H4v-2zm16 0H8v2h12v-2zM4 16h2v2H4v-2zm16 0H8v2h12v-2z\" fill=\"currentColor\"><\/path><\/svg><svg style=\"fill: #999;color:#999\" class=\"arrow-unsorted-368013\" xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"10px\" height=\"10px\" viewBox=\"0 0 24 24\" version=\"1.2\" baseProfile=\"tiny\"><path d=\"M18.2 9.3l-6.2-6.3-6.2 6.3c-.2.2-.3.4-.3.7s.1.5.3.7c.2.2.4.3.7.3h11c.3 0 .5-.1.7-.3.2-.2.3-.5.3-.7s-.1-.5-.3-.7zM5.8 14.7l6.2 6.3 6.2-6.3c.2-.2.3-.5.3-.7s-.1-.5-.3-.7c-.2-.2-.4-.3-.7-.3h-11c-.3 0-.5.1-.7.3-.2.2-.3.5-.3.7s.1.5.3.7z\"\/><\/svg><\/span><\/span><\/span><\/a><\/span><\/div>\n<nav><ul class='ez-toc-list ez-toc-list-level-1 ' ><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-1\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E5%89%8D%E8%A8%80\" >\u524d\u8a00<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-2\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E8%A7%A3%E6%9E%90%E5%99%A8%E7%AE%80%E4%BB%8B\" >\u89e3\u6790\u5668\u7b80\u4ecb<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-3\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E8%A7%A3%E6%9E%90%E5%99%A8%E7%9A%84%E5%9F%BA%E7%A1%80%E4%BD%BF%E7%94%A8\" >\u89e3\u6790\u5668\u7684\u57fa\u7840\u4f7f\u7528<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-4\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E5%88%9B%E5%BB%BA%E7%9F%A5%E8%AF%86%E5%BA%93\" >\u521b\u5efa\u77e5\u8bc6\u5e93<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-5\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E5%88%9B%E5%BB%BA%E8%A7%A3%E6%9E%90%E5%99%A8\" >\u521b\u5efa\u89e3\u6790\u5668<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-6\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E5%88%9B%E5%BB%BAchain%E9%93%BE\" >\u521b\u5efachain\u94fe<\/a><ul class='ez-toc-list-level-4' ><li class='ez-toc-heading-level-4'><a class=\"ez-toc-link ez-toc-heading-7\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E6%96%B9%E5%BC%8F%E4%B8%80%EF%BC%9A%E4%BC%A0%E7%BB%9F%E7%9A%84%E7%AE%A1%E9%81%93%E7%AC%A6%E6%9E%84%E5%BB%BAchain\" >\u65b9\u5f0f\u4e00\uff1a\u4f20\u7edf\u7684\u7ba1\u9053\u7b26\u6784\u5efachain<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-4'><a class=\"ez-toc-link ez-toc-heading-8\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E6%96%B9%E5%BC%8F%E4%BA%8C%EF%BC%9A%E4%BD%BF%E7%94%A8create_retrieval_chain%E6%9E%84%E5%BB%BA\" >\u65b9\u5f0f\u4e8c\uff1a\u4f7f\u7528create_retrieval_chain\u6784\u5efa<\/a><\/li><\/ul><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-9\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E8%A7%A3%E6%9E%90%E5%99%A8%E7%9A%84%E4%B8%8D%E5%90%8C%E7%B1%BB%E5%9E%8B\" >\u89e3\u6790\u5668\u7684\u4e0d\u540c\u7c7b\u578b<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-10\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E5%A4%9A%E6%9F%A5%E8%AF%A2%E6%A3%80%E7%B4%A2%E5%99%A8_MultiQueryRetriever\" >\u591a\u67e5\u8be2\u68c0\u7d22\u5668 MultiQueryRetriever<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-11\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E7%BB%93%E5%90%88%E6%A3%80%E7%B4%A2%E5%99%A8_EnsembleRetriever\" >\u7ed3\u5408\u68c0\u7d22\u5668 EnsembleRetriever<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-12\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E9%95%BF%E4%B8%8A%E4%B8%8B%E6%96%87%E9%87%8D%E6%8E%92%E5%BA%8F_LongContextReorder\" >\u957f\u4e0a\u4e0b\u6587\u91cd\u6392\u5e8f LongContextReorder<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-13\" href=\"https:\/\/17aitech.com\/?p=20566\/#ElasticSearchBM25Retriever\" >ElasticSearchBM25Retriever<\/a><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-14\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E8%87%AA%E5%AE%9A%E4%B9%89%E4%B8%80%E4%B8%AAretriever\" >\u81ea\u5b9a\u4e49\u4e00\u4e2aretriever<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-15\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E9%99%84%E5%BD%95\" >\u9644\u5f55<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-16\" href=\"https:\/\/17aitech.com\/?p=20566\/#ElasticSearch%E7%9A%84Docker%E5%AE%89%E8%A3%85%E6%95%99%E7%A8%8B\" >ElasticSearch\u7684Docker\u5b89\u88c5\u6559\u7a0b<\/a><ul class='ez-toc-list-level-4' ><li class='ez-toc-heading-level-4'><a class=\"ez-toc-link ez-toc-heading-17\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E5%AE%89%E8%A3%85Docker\" >\u5b89\u88c5Docker<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-4'><a class=\"ez-toc-link ez-toc-heading-18\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E5%88%9B%E5%BB%BA%E7%BD%91%E7%BB%9C\" >\u521b\u5efa\u7f51\u7edc<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-4'><a class=\"ez-toc-link ez-toc-heading-19\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E6%8B%89%E5%8F%96%E9%95%9C%E5%83%8F\" >\u62c9\u53d6\u955c\u50cf<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-4'><a class=\"ez-toc-link ez-toc-heading-20\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E5%88%9B%E5%BB%BA%E6%8C%82%E8%BD%BD%E7%82%B9%E7%9B%AE%E5%BD%95\" >\u521b\u5efa\u6302\u8f7d\u70b9\u76ee\u5f55<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-4'><a class=\"ez-toc-link ez-toc-heading-21\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E5%90%AF%E5%8A%A8%E5%AE%B9%E5%99%A8\" >\u542f\u52a8\u5bb9\u5668<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-4'><a class=\"ez-toc-link ez-toc-heading-22\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E4%BF%AE%E6%94%B9elasticsearch%E7%9A%84%E5%AF%86%E7%A0%81\" >\u4fee\u6539elasticsearch\u7684\u5bc6\u7801<\/a><\/li><\/ul><\/li><\/ul><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-23\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E5%86%85%E5%AE%B9%E5%B0%8F%E7%BB%93\" >\u5185\u5bb9\u5c0f\u7ed3<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-24\" href=\"https:\/\/17aitech.com\/?p=20566\/#%E5%8F%82%E8%80%83%E8%B5%84%E6%96%99\" >\u53c2\u8003\u8d44\u6599<\/a><\/li><\/ul><\/nav><\/div>\n<h2><span class=\"ez-toc-section\" id=\"%E5%89%8D%E8%A8%80\"><\/span>\u524d\u8a00<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u5728\u4e0a\u4e00\u7ae0<a href=\"https:\/\/17aitech.com\/?p=18186\">\u3010\u8bfe\u7a0b\u603b\u7ed3\u3011day28\uff1a\u5927\u6a21\u578b\u4e4b\u6df1\u5165\u63a2\u7d22RAG\u6d41\u7a0b<\/a>\u4e2d\uff0c\u6211\u4eec\u5bf9RAG\u6d41\u7a0b\u4e2d <code>\u6587\u6863\u8bfb\u53d6(LOAD)<\/code> -&gt; <code>\u6587\u6863\u5207\u5206(SPLIT)<\/code> -&gt; <code>\u5411\u91cf\u5316(EMBED)<\/code> -&gt; <code>\u5b58\u50a8(STORE)<\/code> \u8fdb\u884c\u4e86\u6df1\u5165\u4e86\u89e3\uff0c\u672c\u7ae0\u5c06\u63a5\u7740\u6df1\u5165\u4e86\u89e3 <code>\u89e3\u6790(Retrieval)<\/code> \u7684\u4f7f\u7528<\/p>\n<h2><span class=\"ez-toc-section\" id=\"%E8%A7%A3%E6%9E%90%E5%99%A8%E7%AE%80%E4%BB%8B\"><\/span>\u89e3\u6790\u5668\u7b80\u4ecb<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/retriever\u6d41\u7a0b.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/retriever\u6d41\u7a0b.png\" alt=\"\" \/><\/a><\/p>\n<p><strong>\u7b80\u4ecb<\/strong>\uff1a\u5728 RAG\uff08Retrieval-Augmented Generation\uff09\u6d41\u7a0b\u4e2d\uff0cRetrieval\uff08\u68c0\u7d22\uff09\u662f\u5173\u952e\u73af\u8282\uff0c\u5176\u4e3b\u8981\u76ee\u6807\u662f\u4ece\u5927\u91cf\u6587\u6863\u6216\u77e5\u8bc6\u5e93\u4e2d\u63d0\u53d6\u4e0e\u7528\u6237\u67e5\u8be2\u76f8\u5173\u7684\u4fe1\u606f\u3002<\/p>\n<p><strong>\u76ee\u7684<\/strong>\uff1a<\/p>\n<ul>\n<li>\u4fe1\u606f\u83b7\u53d6\uff1a\u6839\u636e\u7528\u6237\u7684\u67e5\u8be2\uff0c\u4ece\u5916\u90e8\u77e5\u8bc6\u5e93\u4e2d\u83b7\u53d6\u76f8\u5173\u6587\u6863\u6216\u7247\u6bb5\uff0c\u4ee5\u589e\u5f3a\u751f\u6210\u6a21\u578b\u7684\u4e0a\u4e0b\u6587\u4fe1\u606f\u3002<\/li>\n<li>\u63d0\u9ad8\u51c6\u786e\u6027\uff1a\u901a\u8fc7\u63d0\u4f9b\u5177\u4f53\u7684\u3001\u76f8\u5173\u7684\u4fe1\u606f\uff0c\u5e2e\u52a9\u751f\u6210\u6a21\u578b\uff08\u5982\u8bed\u8a00\u6a21\u578b\uff09\u4ea7\u751f\u66f4\u51c6\u786e\u548c\u4e0a\u4e0b\u6587\u76f8\u5173\u7684\u56de\u7b54\u3002<\/li>\n<\/ul>\n<p><strong>\u6d41\u7a0b<\/strong><\/p>\n<ol>\n<li>\u7528\u6237\u67e5\u8be2\uff1a\u7528\u6237\u8f93\u5165\u4e00\u4e2a\u67e5\u8be2\u6216\u95ee\u9898\u3002<\/li>\n<li>\u68c0\u7d22\u5668\uff1a\u4f7f\u7528\u68c0\u7d22\u7b97\u6cd5\uff08\u5982 BM25\u3001TF-IDF \u6216\u57fa\u4e8e\u5d4c\u5165\u7684\u68c0\u7d22\uff09\u641c\u7d22\u77e5\u8bc6\u5e93\uff0c\u627e\u5230\u4e0e\u67e5\u8be2\u6700\u76f8\u5173\u7684\u6587\u6863\u3002<\/li>\n<li>\u6587\u6863\u8bc4\u5206\uff1a\u5bf9\u68c0\u7d22\u5230\u7684\u6587\u6863\u8fdb\u884c\u8bc4\u5206\uff0c\u901a\u5e38\u4f9d\u636e\u76f8\u5173\u6027\u5f97\u5206\u6765\u6392\u5e8f\u3002<\/li>\n<li>\u8fd4\u56de\u7ed3\u679c\uff1a\u5c06\u6700\u76f8\u5173\u7684\u6587\u6863\u6216\u7247\u6bb5\u8fd4\u56de\u7ed9\u751f\u6210\u6a21\u578b\u3002<\/li>\n<\/ol>\n<h2><span class=\"ez-toc-section\" id=\"%E8%A7%A3%E6%9E%90%E5%99%A8%E7%9A%84%E5%9F%BA%E7%A1%80%E4%BD%BF%E7%94%A8\"><\/span>\u89e3\u6790\u5668\u7684\u57fa\u7840\u4f7f\u7528<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<h3><span class=\"ez-toc-section\" id=\"%E5%88%9B%E5%BB%BA%E7%9F%A5%E8%AF%86%E5%BA%93\"><\/span>\u521b\u5efa\u77e5\u8bc6\u5e93<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p><strong>\u7b2c\u4e00\u6b65<\/strong>\uff1a\u542f\u52a8Chroma\u6570\u636e\u5e93<\/p>\n<pre><code class=\"language-bash\">chroma run --path chroma_xiyou --port 8000<\/code><\/pre>\n<p><strong>\u7b2c\u4e8c\u6b65<\/strong>\uff1a\u4f7f\u7528<a href=\"https:\/\/17aitech.com\/?p=18186\">RAG\u57fa\u7840\u6d41\u7a0b\uff1aLoad-&gt;Split-&gt;EMBED-&gt;STORE<\/a>\u521b\u5efa\u4e00\u4e2a\u77e5\u8bc6\u5e93<\/p>\n<pre><code class=\"language-python\">from langchain_text_splitters import RecursiveCharacterTextSplitter\nfrom langchain.embeddings import HuggingFaceEmbeddings\nfrom langchain.document_loaders import PyMuPDFLoader\nfrom langchain_chroma import Chroma\nfrom chromadb import Settings\nfrom chromadb import Client\nfrom utils import get_ernie_models\nimport chromadb\n\n# \u8fde\u63a5\u5927\u6a21\u578b\nllm_ernie, chat_ernie, embed_ernie = get_ernie_models()\n\n# \u521d\u59cb\u5316 HuggingFaceEmbeddings\nembedding_function = HuggingFaceEmbeddings(model_name=&quot;bert-base-chinese&quot;)\n\n# \u52a0\u8f7d\u6587\u6863\npdf_loader = PyMuPDFLoader(&quot;testfiles\/\u897f\u6e38\u8bb0.pdf&quot;)\ndocuments = pdf_loader.load()\n\n# \u5207\u5206\u6587\u6863\nspliter = RecursiveCharacterTextSplitter(chunk_size=128, chunk_overlap=64)\ndocs = spliter.split_documents(documents)\n\n# \u914d\u7f6e\u8fde\u63a5\u4fe1\u606f\nclient = chromadb.HttpClient(host=&#039;localhost&#039;, port=8000)\n\nchroma_db = Chroma(\n    embedding_function=embedding_function,\n    client=client\n)\n\nbatch_size = 6  # \u6bcf\u6b21\u5904\u7406\u7684\u6837\u672c\u6570\u91cf\n\n# \u5206\u6279\u5165\u5e93\nfor i in range(0, len(docs), batch_size):\n    batch = docs[i:i + batch_size]  # \u83b7\u53d6\u5f53\u524d\u6279\u6b21\u7684\u6837\u672c\n    print(f&#039;Processing batch {i} to {i + batch_size}, total {len(batch)} samples&#039;)\n    chroma_db.add_documents(documents=batch)  # \u5165\u5e93<\/code><\/pre>\n<p>\u8bf4\u660e\uff1a<\/p>\n<ul>\n<li><strong>\u5411\u91cf\u5316\u8bf4\u660e<\/strong>\uff1a\u7531\u4e8eQwen\u548c\u767e\u5ea6\u5343\u5e06\u7684\u5411\u91cf\u63a5\u53e3\u9650\u5236\u8f83\u591a\uff0c\u5bf9\u4e8e\u5411\u91cf\u5316\u897f\u6e38\u8bb0\u8fd9\u672c\u4e66\u6765\u8bf4\uff0c\u7ecf\u5e38\u4f1a\u9047\u5230\u8d85\u51fa\u9650\u5236\u7b49\u95ee\u9898\uff0c\u6240\u4ee5\u6b64\u5904\u6211\u5c06\u5411\u91cf\u5316\u63a5\u53e3\u6362\u4e3aHuggingFaceEmbeddings()\uff0c\u8be5\u63a5\u53e3\u53ef\u80fd\u4f1a\u5b58\u5728\u88abBan\u7684\u98ce\u9669\uff0c\u8bf7\u81ea\u884c\u66f4\u6362\u5411\u91cf\u5316\u63a5\u53e3\u3002<\/li>\n<li><strong>\u6d4b\u8bd5\u6587\u6863<\/strong>\uff1a\u897f\u6e38\u8bb0\u4e0b\u8f7d\u5730\u5740\u8bf7\u89c1<a href=\"https:\/\/pan.quark.cn\/s\/93b12d4185eb#\/list\/share\/e912eb82cdc34d2fb893e62a880ebd9b-%E8%A5%BF%E6%B8%B8%E8%AE%B0(%E8%AE%B0%E5%BE%97%E4%BF%9D%E5%AD%98%E5%88%B0%E4%BA%91%E7%9B%98)\">\u5938\u514b\u7f51\u76d8\uff1a\u897f\u6e38\u8bb0<\/a><\/li>\n<\/ul>\n<h3><span class=\"ez-toc-section\" id=\"%E5%88%9B%E5%BB%BA%E8%A7%A3%E6%9E%90%E5%99%A8\"><\/span>\u521b\u5efa\u89e3\u6790\u5668<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p><strong>\u7b2c\u4e09\u6b65<\/strong>\uff1a\u521b\u5efa\u4e00\u4e2a\u89e3\u6790\u5668<\/p>\n<pre><code class=\"language-python\">retriever = chroma_db.as_retriever()<\/code><\/pre>\n<h3><span class=\"ez-toc-section\" id=\"%E5%88%9B%E5%BB%BAchain%E9%93%BE\"><\/span>\u521b\u5efachain\u94fe<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u521b\u5efachain\u94fe\u6709\u4e24\u79cd\u65b9\u6cd5\uff1a\u4e00\u79cd\u662f\u7ba1\u9053\u7b26\u8fde\u63a5\uff0c\u4e00\u79cd\u662f\u4f7f\u7528 create_retrieval_chain \u3002\u672c\u7ae0\u6211\u4eec\u4e24\u79cd\u65b9\u6cd5\u90fd\u505a\u5c1d\u8bd5\uff0c\u4ee5\u4fbf\u5bf9\u6bd4\u4ee3\u7801\u7684\u5199\u6cd5\u3002<\/p>\n<h4><span class=\"ez-toc-section\" id=\"%E6%96%B9%E5%BC%8F%E4%B8%80%EF%BC%9A%E4%BC%A0%E7%BB%9F%E7%9A%84%E7%AE%A1%E9%81%93%E7%AC%A6%E6%9E%84%E5%BB%BAchain\"><\/span>\u65b9\u5f0f\u4e00\uff1a\u4f20\u7edf\u7684\u7ba1\u9053\u7b26\u6784\u5efachain<span class=\"ez-toc-section-end\"><\/span><\/h4>\n<pre><code class=\"language-python\"># RAG\u7cfb\u7edf\u7ecf\u5178\u7684 Prompt \nprompt = ChatPromptTemplate.from_messages([\n  (&quot;human&quot;, &quot;&quot;&quot;You are an assistant for question-answering tasks. Use the following pieces \n  of retrieved context to answer the question. \n  If you don&#039;t know the answer, just say that you don&#039;t know. \n  Use three sentences maximum and keep the answer concise.\n  Question: {question} \n  Context: {context} \n  Answer:&quot;&quot;&quot;)\n])\n\ndef format_docs(docs):\n    return &quot;\\n\\n&quot;.join(doc.page_content for doc in docs)\n\n# RAG \u94fe\nrag_chain = (\n    {&quot;context&quot;: retriever | format_docs, \n     &quot;question&quot;: RunnablePassthrough()}\n    | prompt\n    | chat_ernie\n    | StrOutputParser()\n)\n\nrag_chain.invoke(input=&quot;\u5b59\u609f\u7a7a\u4e09\u6253\u767d\u9aa8\u7cbe\u65f6\uff0c\u767d\u9aa8\u7cbe\u5206\u522b\u53d8\u6210\u4e86\u54ea\u4e9b\u5f62\u6001?&quot;)<\/code><\/pre>\n<p>\u8fd0\u884c\u7ed3\u679c\uff1a<br \/>\n<a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u4f20\u7edfRAG\u8fd0\u884c\u622a\u56fe.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u4f20\u7edfRAG\u8fd0\u884c\u622a\u56fe.png\" alt=\"\" \/><\/a><\/p>\n<h4><span class=\"ez-toc-section\" id=\"%E6%96%B9%E5%BC%8F%E4%BA%8C%EF%BC%9A%E4%BD%BF%E7%94%A8create_retrieval_chain%E6%9E%84%E5%BB%BA\"><\/span>\u65b9\u5f0f\u4e8c\uff1a\u4f7f\u7528create_retrieval_chain\u6784\u5efa<span class=\"ez-toc-section-end\"><\/span><\/h4>\n<pre><code class=\"language-python\">from langchain.chains import create_retrieval_chain\nfrom langchain.chains.combine_documents import create_stuff_documents_chain\nfrom langchain_core.prompts import ChatPromptTemplate\n\nprompt = ChatPromptTemplate.from_messages([\n  (&quot;system&quot;, &quot;&quot;&quot;Answer any use questions based solely on the context below:\n&lt;context&gt;\n{context}\n&lt;\/context&gt;&quot;&quot;&quot;),\n  (&quot;placeholder&quot;, &quot;{chat_history}&quot;),\n  (&quot;human&quot;, &quot;{input}&quot;),\n])\n\ncombine_docs_chain = create_stuff_documents_chain(\n    llm=chat_ernie,prompt= prompt\n)\n\nchain = create_retrieval_chain(retriever=retriever, combine_docs_chain=combine_docs_chain)\n\nchain.invoke(input={&quot;input&quot;:&quot;\u5b59\u609f\u7a7a\u4e09\u6253\u767d\u9aa8\u7cbe\u65f6\uff0c\u767d\u9aa8\u7cbe\u5206\u522b\u53d8\u6210\u4e86\u54ea\u4e9b\u5f62\u6001?&quot;})<\/code><\/pre>\n<p>\u8bf4\u660e\uff1a<\/p>\n<ul>\n<li>\u4e0a\u8ff0\u7684prompt\u53ef\u4ee5\u5728<a href=\"https:\/\/smith.langchain.com\/hub\/langchain-ai\/retrieval-qa-chat\">smith.langchain.com<\/a>\u4e0a\u67e5\u8be2<code>langchain-ai\/retrieval-qa-chat<\/code>\u5f97\u5230\u3002<\/li>\n<\/ul>\n<p>\u8fd0\u884c\u7ed3\u679c\uff1a<br \/>\n<a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/create_retrieval\u7684\u6267\u884c\u7ed3\u679c.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/create_retrieval\u7684\u6267\u884c\u7ed3\u679c.png\" alt=\"\" \/><\/a><\/p>\n<p>\u901a\u8fc7\u5bf9\u6bd4\uff0c\u53ef\u4ee5\u770b\u5230\u4f7f\u7528 <code>create_retrieval_chain<\/code> \u521b\u5efachain\u65f6\uff0c\u53ef\u4ee5\u51cf\u5c11format_docs()\u6b65\u9aa4\u4ee5\u53ca\u4f7f\u7528\u7ba1\u9053\u7b26\u90e8\u5206\u7684\u4ee3\u7801\u91cf\uff0c\u7b80\u5316\u8c03\u7528\u6b65\u9aa4\u3002<\/p>\n<p>\u4ee5\u4e0a\u8c03\u7528\u5373\u4e3a\u5b8c\u6574\u7684\u89e3\u6790\u5668\u4f7f\u7528\u6d41\u7a0b\uff0c\u5176\u4e2d\u7b2c\u4e09\u6b65\u4e2d <code>retriever = chroma_db.as_retriever()<\/code> \u53ef\u4ee5\u6709\u591a\u79cd\u65b9\u5f0f\u6784\u5efa\u89e3\u6790\u5668\u3002\u672c\u7ae0\u5185\u5bb9\uff0c\u6211\u4eec\u7740\u91cd\u5bf9\u6b64\u6df1\u5165\u7814\u7a76\u3002<\/p>\n<h2><span class=\"ez-toc-section\" id=\"%E8%A7%A3%E6%9E%90%E5%99%A8%E7%9A%84%E4%B8%8D%E5%90%8C%E7%B1%BB%E5%9E%8B\"><\/span>\u89e3\u6790\u5668\u7684\u4e0d\u540c\u7c7b\u578b<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>\u9664\u4e86\u4e0a\u9762\u57fa\u7840\u7684\u5411\u91cf\u5b58\u50a8\u68c0\u7d22\u5668\u4e4b\u5916\uff0cLangchain \u8fd8\u63d0\u4f9b\u4e86\u591a\u79cd\u9ad8\u7ea7\u68c0\u7d22\u7c7b\u578b\uff0c\u5305\u62ec\u591a\u67e5\u8be2\u68c0\u7d22\u5668\uff08MultiQueryRetriever\uff09\u3001\u7ed3\u5408\u68c0\u7d22\u5668\uff08EnsembleRetriever\uff09\u7b49\u3002<\/p>\n<h3><span class=\"ez-toc-section\" id=\"%E5%A4%9A%E6%9F%A5%E8%AF%A2%E6%A3%80%E7%B4%A2%E5%99%A8_MultiQueryRetriever\"><\/span>\u591a\u67e5\u8be2\u68c0\u7d22\u5668 MultiQueryRetriever<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p><strong>\u7b80\u4ecb<\/strong>:<br \/>\n<code>MultiQueryRetriever<\/code> \u662f\u4e00\u79cd\u68c0\u7d22\u7b97\u6cd5\uff0c\u5b83\u901a\u8fc7\u4f7f\u7528\u5927\u578b\u8bed\u8a00\u6a21\u578b(LLM)\u751f\u6210\u591a\u4e2a\u67e5\u8be2\uff0c\u4ece\u800c\u81ea\u52a8\u5316\u63d0\u793a\u8c03\u4f18\u8fc7\u7a0b\u3002<\/p>\n<p><strong>\u529f\u80fd<\/strong>:<br \/>\n\u5b83\u4e3a\u7ed9\u5b9a\u7684\u7528\u6237\u8f93\u5165\u67e5\u8be2\u751f\u6210\u591a\u4e2a\u4e0d\u540c\u89c6\u89d2\u7684\u67e5\u8be2\u3002\u5bf9\u4e8e\u6bcf\u4e2a\u67e5\u8be2\uff0c\u5b83\u68c0\u7d22\u4e00\u7ec4\u76f8\u5173\u6587\u6863\uff0c\u5e76\u901a\u8fc7\u6240\u6709\u67e5\u8be2\u7684\u552f\u4e00\u8054\u5408\u6765\u83b7\u5f97\u66f4\u5927\u7684\u4e00\u7ec4\u6f5c\u5728\u76f8\u5173\u6587\u6863\u3002\u8fd9\u79cd\u65b9\u6cd5\u63d0\u9ad8\u4e86\u68c0\u7d22\u7684\u51c6\u786e\u6027\u548c\u591a\u6837\u6027\u3002<\/p>\n<p><strong>\u4f7f\u7528\u573a\u666f<\/strong>:<br \/>\n\u5f53\u7528\u6237\u7684\u95ee\u9898\u590d\u6742\u5e76\u4e14\u9700\u8981\u591a\u6761\u4e0d\u540c\u7684\u4fe1\u606f\u6765\u56de\u7b54\u65f6\uff0c<code>MultiQueryRetriever<\/code> \u7279\u522b\u6709\u7528\u3002\u5b83\u53ef\u4ee5\u5728\u9700\u8981\u5173\u4e8e\u591a\u4e2a\u4e3b\u9898\u7684\u4fe1\u606f\u65f6\u63d0\u4f9b\u66f4\u5168\u9762\u7684\u7ed3\u679c<\/p>\n<p><strong>\u4f7f\u7528\u65b9\u6cd5<\/strong>\uff1a<br \/>\n<strong>\u7b2c\u4e00\u6b65<\/strong>\uff1a\u6784\u5efa\u77e5\u8bc6\u5e93(\u6b64\u5904\u590d\u7528\u4e0a\u9762\u7684\u77e5\u8bc6\u5e93\uff0c\u8be6\u7ec6\u5185\u5bb9\u4e0d\u518d\u8d58\u8ff0)<\/p>\n<p><strong>\u7b2c\u4e8c\u6b65<\/strong>\uff1a\u4f7f\u7528MultiQueryRetriever<\/p>\n<pre><code class=\"language-python\">import logging\nfrom langchain.retrievers.multi_query import MultiQueryRetriever\n\nquestion = &quot;\u5b59\u609f\u7a7a\u4e09\u6253\u767d\u9aa8\u7cbe\u65f6\uff0c\u767d\u9aa8\u7cbe\u5206\u522b\u53d8\u6210\u4e86\u54ea\u4e9b\u5f62\u6001?&quot;\n\n# \u628a\u5411\u91cf\u64cd\u4f5c\u5c01\u88c5\u4e3a\u4e00\u4e2a\u57fa\u672c\u68c0\u7d22\u5668\nretriever = chroma_db.as_retriever()\n\nretriever_from_llm = MultiQueryRetriever.from_llm(\n    retriever=chroma_db.as_retriever(), llm=chat_ernie\n)\n\nlogging.basicConfig()\nlogging.getLogger(&quot;langchain.retrievers.multi_query&quot;).setLevel(logging.INFO)\n\nunique_docs = retriever_from_llm.get_relevant_documents(query=question)\nunique_docs\n\nprint(f&#039;\u8fd4\u56de\u7684\u6587\u6863\u4e2a\u6570\uff1a{len(unique_docs)}&#039;)\nprint(f&#039;\u8fd4\u56de\u7684\u6587\u6863\u5185\u5bb9\uff1a&#039;)\nfor doc in unique_docs:\n    print(doc.page_content)<\/code><\/pre>\n<p>\u8fd0\u884c\u7ed3\u679c\uff1a<\/p>\n<pre><code class=\"language-bash\">INFO:langchain.retrievers.multi_query:Generated \nqueries: [&#039;\u4ee5\u4e0b\u662f\u4e09\u4e2a\u4e0d\u540c\u7248\u672c\u7684\u751f\u6210\u95ee\u9898\uff0c\u65e8\u5728\u4ece\u4e0d\u540c\u89d2\u5ea6\u63a2\u7d22\u539f\u59cb\u95ee\u9898\u7684\u76f8\u5173\u4fe1\u606f\uff1a&#039;, \n&#039;1. \u5b59\u609f\u7a7a\u5728\u4e09\u6253\u767d\u9aa8\u7cbe\u7684\u60c5\u8282\u4e2d\uff0c\u767d\u9aa8\u7cbe\u5206\u522b\u5316\u4f5c\u4e86\u54ea\u4e9b\u751f\u7269\u6216\u7269\u4f53\u5f62\u6001\uff1f&#039;, \n&#039;2. \u5b59\u609f\u7a7a\u4e09\u6253\u767d\u9aa8\u7cbe\u65f6\uff0c\u767d\u9aa8\u7cbe\u53d8\u8eab\u7684\u5f62\u6001\u6709\u54ea\u4e9b\uff1f\u8bf7\u8be6\u7ec6\u5217\u51fa\u3002&#039;, \n&#039;3. \u5728\u300a\u897f\u6e38\u8bb0\u300b\u4e2d\uff0c\u767d\u9aa8\u7cbe\u5728\u5b59\u609f\u7a7a\u4e09\u6253\u5979\u7684\u8fc7\u7a0b\u4e2d\uff0c\u5979\u53d8\u6362\u6210\u4e86\u54ea\u4e9b\u4e0d\u540c\u7684\u8eab\u4efd\u6216\u5916\u89c2\uff1f&#039;, \n&#039;\u5e0c\u671b\u4ee5\u4e0a\u95ee\u9898\u53ef\u4ee5\u5e2e\u52a9\u4f60\u4ece\u4e0d\u540c\u7684\u89d2\u5ea6\u83b7\u53d6\u76f8\u5173\u4fe1\u606f\uff0c\u4ece\u800c\u66f4\u5168\u9762\u5730\u56de\u7b54\u539f\u59cb\u95ee\u9898\u3002&#039;]<\/code><\/pre>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/MultiQueryRetriever\u6267\u884c\u7ed3\u679c.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/MultiQueryRetriever\u6267\u884c\u7ed3\u679c.png\" alt=\"\" \/><\/a><\/p>\n<p><strong>\u7b2c\u4e09\u6b65<\/strong>\uff1a\u4f7f\u7528 create_retrieval_chain \u8fdb\u884c\u5b8c\u6574\u67e5\u8be2<\/p>\n<pre><code class=\"language-python\">from langchain.chains import create_retrieval_chain\nfrom langchain.chains.combine_documents import create_stuff_documents_chain\nfrom langchain_core.prompts import ChatPromptTemplate\n\n# \u521b\u5efa\u7ed3\u5408\u6587\u6863\u7684\u94fe\nprompt = ChatPromptTemplate.from_messages([\n    (&quot;system&quot;, &quot;&quot;&quot;Answer any user questions based solely on the context below:\n&lt;context&gt;\n{context}\n&lt;\/context&gt;&quot;&quot;&quot;),\n    (&quot;placeholder&quot;, &quot;{chat_history}&quot;),\n    (&quot;human&quot;, &quot;{input}&quot;),\n])\n\ncombine_docs_chain = create_stuff_documents_chain(\n    llm=chat_ernie, prompt=prompt\n)\n\n# \u521b\u5efa\u68c0\u7d22\u94fe\nchain = create_retrieval_chain(retriever=retriever_from_llm, combine_docs_chain=combine_docs_chain)\n\n# \u4f7f\u7528\u94fe\u8fdb\u884c\u67e5\u8be2\nresult = chain.invoke(input={&quot;input&quot;: question})\n\n# \u8f93\u51fa\u6700\u7ec8\u7ed3\u679c\nprint(&quot;\u6700\u7ec8\u56de\u7b54\uff1a&quot;, result)<\/code><\/pre>\n<p>\u8fd0\u884c\u7ed3\u679c\uff1a<\/p>\n<pre><code class=\"language-bash\">\u6700\u7ec8\u56de\u7b54\uff1a {&#039;input&#039;: &#039;\u5b59\u609f\u7a7a\u4e09\u6253\u767d\u9aa8\u7cbe\u65f6\uff0c\u767d\u9aa8\u7cbe\u5206\u522b\u53d8\u6210\u4e86\u54ea\u4e9b\u5f62\u6001?&#039;, \n&#039;context&#039;: [\n    Document(metadata={&#039;author&#039;: &#039;\u5434\u627f\u6069&#039;, &#039;creationDate&#039;: &quot;D:20240329064911+00&#039;00&#039;&quot;, &#039;creator&#039;: &#039;calibre 3.23.0 [https:\/\/calibre-ebook.com]&#039;, &#039;file_path&#039;: &#039;testfiles\/\u897f\u6e38\u8bb0.pdf&#039;, &#039;format&#039;: &#039;PDF 1.4&#039;, &#039;keywords&#039;: &#039;&#039;, &#039;modDate&#039;: &#039;&#039;, &#039;page&#039;: 7, &#039;producer&#039;: &#039;calibre 3.23.0 [https:\/\/calibre-ebook.com]&#039;, &#039;source&#039;: &#039;testfiles\/\u897f\u6e38\u8bb0.pdf&#039;, &#039;subject&#039;: &#039;&#039;, &#039;title&#039;: &#039;\u897f\u6e38\u8bb0\uff08\u4eba\u6587\u793e\u7ecf\u5178\u5f69\u76ae\u7248\uff0c\u957f\u950070\u5e74\uff0c\u4ee5\u660e\u4ee3\u4e16\u5fb7\u5802\u672c\u4e3a\u5e95\u672c\uff1b\u4e09\u6b21\u4fee\u8ba2\u91cd\u6821\uff1b\u8c46\u74e3\u4e0a\u4e07\u6761\u8bc4\u8bba\uff1b2020\u5e74\u6559\u80b2\u90e8\u6307\u5bfc\u76ee\u5f55\u56fe\u4e66\uff09&#039;, &#039;total_pages&#039;: 675, &#039;trapped&#039;: &#039;&#039;}, page_content=&#039;\u4e86\u8bb8\u591a\u65b0\u7684\u6210\u679c\uff0c\u4e3a\u4e86\u80fd\u8ba9\u5e7f\u5927\u8bfb\u8005\u66f4\u597d\u5730\u7406\u89e3\u8be5\u4f5c\u54c1\uff0c\u8fd9\u6b21\u7279\u610f\u9080\u8bf7\u5317\u4eac\u5927\u5b66\u5218\u52c7\u5f3a\u6559\u6388\u91cd\u65b0\u4e3a\u8be5\u4e66\u64b0\\n\u5199\u4e86\u524d\u8a00\u3002\\n\u516d\u3001\u5173\u4e8e\u53d6\u7ecf\u9014\u4e2d\u6240\u9047\u7684\u516b\u5341\u4e00\u96be\u987a\u5e8f\uff0c\u7b2c\u4e5d\u5341\u4e5d\u56de\u8bf8\u795e\u7ed9\u89c2\u97f3\u83e9\u8428\u63d0\u4f9b\u7684\u7c3f\u5b50\u6240\u8bb0\uff0c\u4e0e\u5c0f\u8bf4\u7684\u53d9\u8ff0&#039;), \n    ....\uff08\u5185\u5bb9\u8fc7\u591a\uff0c\u6b64\u5904\u7701\u7565\uff09\n    Document(metadata={&#039;author&#039;: &#039;\u5434\u627f\u6069&#039;, &#039;creationDate&#039;: &quot;D:20240329064911+00&#039;00&#039;&quot;, &#039;creator&#039;: &#039;calibre 3.23.0 [https:\/\/calibre-ebook.com]&#039;, &#039;file_path&#039;: &#039;testfiles\/\u897f\u6e38\u8bb0.pdf&#039;, &#039;format&#039;: &#039;PDF 1.4&#039;, &#039;keywords&#039;: &#039;&#039;, &#039;modDate&#039;: &#039;&#039;, &#039;page&#039;: 6, &#039;producer&#039;: &#039;calibre 3.23.0 [https:\/\/calibre-ebook.com]&#039;, &#039;source&#039;: &#039;testfiles\/\u897f\u6e38\u8bb0.pdf&#039;, &#039;subject&#039;: &#039;&#039;, &#039;title&#039;: &#039;\u897f\u6e38\u8bb0\uff08\u4eba\u6587\u793e\u7ecf\u5178\u5f69\u76ae\u7248\uff0c\u957f\u950070\u5e74\uff0c\u4ee5\u660e\u4ee3\u4e16\u5fb7\u5802\u672c\u4e3a\u5e95\u672c\uff1b\u4e09\u6b21\u4fee\u8ba2\u91cd\u6821\uff1b\u8c46\u74e3\u4e0a\u4e07\u6761\u8bc4\u8bba\uff1b2020\u5e74\u6559\u80b2\u90e8\u6307\u5bfc\u76ee\u5f55\u56fe\u4e66\uff09&#039;, &#039;total_pages&#039;: 675, &#039;trapped&#039;: &#039;&#039;}, page_content=&#039;\u4e94\u3001\u66f4\u6362\u524d\u8a00\u3002\u672c\u4e66\u7684\u524d\u8a00\uff0c\u8fc7\u53bb\u4e00\u76f4\u6cbf\u7528\u534e\u4e1c\u5e08\u8303\u5927\u5b66\u90ed\u8c6b\u9002\u3001\u7b80\u8302\u68ee\u6559\u6388\u4e00\u4e5d\u4e03\u4e8c\u5e74\u6240\u5199\u7684\u6587\\n\u5b57\uff0c\u9650\u4e8e\u5f53\u65f6\u7684\u5386\u53f2\u73af\u5883\uff0c\u653f\u6cbb\u5316\u8272\u5f69\u8f83\u6d53\uff0c\u800c\u300a\u897f\u6e38\u8bb0\u300b\u7814\u7a76\u5728\u8fc7\u53bb\u7684\u51e0\u5341\u5e74\u4e2d\u53d6\u5f97\u4e86\u5f88\u5927\u53d1\u5c55\uff0c\u51fa\u73b0&#039;)], \n    &#039;answer&#039;: &#039;\u6839\u636e\u539f\u6587\u4fe1\u606f\u5f97\u51fa\uff0c\u5b59\u609f\u7a7a\u4e09\u6253\u767d\u9aa8\u7cbe\u65f6\uff0c\u767d\u9aa8\u7cbe\u5206\u522b\u53d8\u6210\u4e86\u7f8e\u4e3d\u7684\u6751\u59d1\u3001\u5e74\u6ee1\u516b\u65ec\u7684\u8001\u5987\u4eba\u3001\u548c\u4e00\u4f4d\u767d\u53d1\u82cd\u82cd\u7684\u8001\u516c\u516c\u3002&#039;}<\/code><\/pre>\n<p>\u901a\u8fc7\u4ee5\u4e0a\u5b9e\u8df5\uff0c\u53ef\u4ee5\u770b\u5230\uff1a<br \/>\n1\u3001MultiQueryRetriever\u4f1a\u501f\u52a9\u5927\u6a21\u578b\u751f\u6210\u65b0\u7684\u591a\u4e2a\u67e5\u8be2 queries\uff1b<br \/>\n2\u3001MultiQueryRetriever\u4f1a\u901a\u8fc7\u8fd9\u4e9b queries \u68c0\u7d22\u51fa\u76f8\u5173\u7684\u6587\u6863\uff1b<br \/>\n3\u3001\u6700\u540e\uff0c\u901a\u8fc7 combine_docs_chain \u5c06\u68c0\u7d22\u51fa\u7684\u6587\u6863\u4ea4\u7ed9\u5927\u6a21\u578b\u5f97\u5230\u6700\u7ec8\u7b54\u6848\u3002<\/p>\n<h3><span class=\"ez-toc-section\" id=\"%E7%BB%93%E5%90%88%E6%A3%80%E7%B4%A2%E5%99%A8_EnsembleRetriever\"><\/span>\u7ed3\u5408\u68c0\u7d22\u5668 EnsembleRetriever<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p><strong>\u7b80\u4ecb<\/strong>:<br \/>\nEnsembleRetriever\u662f\u4e00\u79cd\u7ed3\u5408\u591a\u4e2a\u68c0\u7d22\u5668\u7ed3\u679c\u7684\u7b97\u6cd5\uff0c\u901a\u8fc7\u91cd\u65b0\u6392\u5e8f\u6765\u63d0\u9ad8\u68c0\u7d22\u6548\u679c\u3002<\/p>\n<p><strong>\u529f\u80fd<\/strong>:<br \/>\n\u8be5\u7b97\u6cd5\u4ece\u591a\u4e2a\u68c0\u7d22\u5668\u4e2d\u83b7\u53d6\u6587\u6863\uff0c\u5e76\u5c06\u5b83\u4eec\u7ec4\u5408\u5728\u4e00\u8d77\uff0c\u4ee5\u63d0\u9ad8\u6587\u672c\u76f8\u4f3c\u6027\u5339\u914d\u548c\u4fe1\u606f\u68c0\u7d22\u7684\u51c6\u786e\u6027\u3002\u901a\u8fc7\u7ed3\u5408\u591a\u79cd\u8865\u5145\u7684\u5411\u91cf\u641c\u7d22\u7b97\u6cd5\uff0cEnsembleRetriever\u63d0\u4f9b\u4e86\u6700\u5148\u8fdb\u7684\u6587\u672c\u76f8\u4f3c\u6027\u5339\u914d\u548c\u4fe1\u606f\u68c0\u7d22\u80fd\u529b\u3002<\/p>\n<p><strong>\u4f7f\u7528\u573a\u666f<\/strong>:<br \/>\n\u5f53\u9700\u8981\u7ed3\u5408\u591a\u79cd\u68c0\u7d22\u65b9\u6cd5\u4ee5\u83b7\u5f97\u66f4\u9ad8\u7684\u68c0\u7d22\u51c6\u786e\u6027\u65f6\uff0cEnsembleRetriever\u662f\u7406\u60f3\u7684\u9009\u62e9\u3002\u8fd9\u79cd\u65b9\u6cd5\u9002\u7528\u4e8e\u9700\u8981\u4ece\u5927\u91cf\u6587\u6863\u96c6\u5408\u4e2d\u8fdb\u884c\u4fe1\u606f\u68c0\u7d22\u7684\u5e94\u7528\u573a\u666f<\/p>\n<p><strong>\u4f7f\u7528\u65b9\u6cd5<\/strong><br \/>\n<strong>\u7b2c\u4e00\u6b65<\/strong>\uff1a\u5b89\u88c5\u4f9d\u8d56\u5305<\/p>\n<pre><code class=\"language-bash\">pip install rank_bm25\npip install faiss-gpu<\/code><\/pre>\n<p><strong>\u7b2c\u4e8c\u6b65<\/strong>\uff1a\u51c6\u5907\u77e5\u8bc6\u6570\u636e<\/p>\n<pre><code class=\"language-bash\">from langchain.retrievers import EnsembleRetriever\nfrom langchain_community.retrievers import BM25Retriever\nfrom langchain_community.vectorstores import FAISS\n\n# \u521d\u59cb\u5316 HuggingFaceEmbeddings\nembedding = HuggingFaceEmbeddings(model_name=&quot;bert-base-chinese&quot;)\n\n# \u4e2d\u6587\u6587\u6863\u5217\u8868\ndoc_list_1 = [\n    &quot;\u6211\u559c\u6b22\u82f9\u679c&quot;,\n    &quot;\u6211\u559c\u6b22\u6a59\u5b50&quot;,\n    &quot;\u82f9\u679c\u548c\u6a59\u5b50\u90fd\u662f\u6c34\u679c&quot;,\n]\n\ndoc_list_2 = [\n    &quot;\u4f60\u559c\u6b22\u82f9\u679c\u5417\uff1f&quot;,\n    &quot;\u4f60\u559c\u6b22\u6a59\u5b50\u5417\uff1f&quot;,\n]\n<\/code><\/pre>\n<p><strong>\u7b2c\u4e09\u6b65<\/strong>\uff1a\u521b\u5efa\u7ec4\u5408\u68c0\u7d22\u5668<\/p>\n<pre><code class=\"language-python\">\n# \u521d\u59cb\u5316 BM25 \u68c0\u7d22\u5668\nbm25_retriever = BM25Retriever.from_texts(\n    doc_list_1, metadatas=[{&quot;source&quot;: 1}] * len(doc_list_1)\n)\nbm25_retriever.k = 2\n\n# \u521b\u5efa FAISS \u5411\u91cf\u5b58\u50a8 \nfaiss_vectorstore = FAISS.from_texts(\n    doc_list_2, embedding, metadatas=[{&quot;source&quot;: 2}] * len(doc_list_2)\n)\nfaiss_retriever = faiss_vectorstore.as_retriever(search_kwargs={&quot;k&quot;: 2})\n\n# \u521d\u59cb\u5316\u7ec4\u5408\u68c0\u7d22\u5668\nensemble_retriever = EnsembleRetriever(\n    retrievers=[bm25_retriever, faiss_retriever], weights=[0.5, 0.5]\n)<\/code><\/pre>\n<p><strong>\u7b2c\u56db\u6b65<\/strong>\uff1a\u8fdb\u884c\u67e5\u8be2<\/p>\n<pre><code class=\"language-python\"># \u8f93\u5165\u67e5\u8be2\ndocs = ensemble_retriever.invoke(&quot;\u6211\u60f3\u77e5\u9053\u5173\u4e8e\u82f9\u679c\u7684\u4fe1\u606f&quot;)\nprint(docs)<\/code><\/pre>\n<p>\u8fd0\u884c\u7ed3\u679c\uff1a<\/p>\n<pre><code class=\"language-bash\">[\n    Document(metadata={&#039;source&#039;: 1}, page_content=&#039;\u82f9\u679c\u548c\u6a59\u5b50\u90fd\u662f\u6c34\u679c&#039;), \n    Document(metadata={&#039;source&#039;: 2}, page_content=&#039;\u4f60\u559c\u6b22\u82f9\u679c\u5417\uff1f&#039;), \n    Document(metadata={&#039;source&#039;: 1}, page_content=&#039;\u6211\u559c\u6b22\u6a59\u5b50&#039;), \n    Document(metadata={&#039;source&#039;: 2}, page_content=&#039;\u4f60\u559c\u6b22\u6a59\u5b50\u5417\uff1f&#039;)\n]<\/code><\/pre>\n<p>\u8bf4\u660e\uff1a<\/p>\n<ul>\n<li>BM25Retriever \u662f\u4e00\u79cd\u57fa\u4e8e\u7ecf\u5178\u4fe1\u606f\u68c0\u7d22\u6a21\u578b BM25 \u7684\u68c0\u7d22\u5668\u3002\u5b83\u7684\u4f18\u70b9:\n<ul>\n<li>\u7b80\u5355\u6613\u7528\uff0c\u9002\u5408\u5904\u7406\u77ed\u6587\u672c\u548c\u5173\u952e\u8bcd\u68c0\u7d22\u3002<\/li>\n<li>\u5bf9\u4e8e\u4f20\u7edf\u7684\u6587\u672c\u5339\u914d\u4efb\u52a1\u8868\u73b0\u826f\u597d\u3002<\/li>\n<\/ul>\n<\/li>\n<li>FAISS\uff08Facebook AI Similarity Search\uff09\u662f\u4e00\u4e2a\u9ad8\u6548\u7684\u76f8\u4f3c\u6027\u641c\u7d22\u5e93\uff0c\u4e13\u95e8\u7528\u4e8e\u5904\u7406\u5927\u89c4\u6a21\u5411\u91cf\u6570\u636e\u3002\u5b83\u7684\u4f18\u70b9\uff1a\n<ul>\n<li>\u9002\u5408\u5904\u7406\u590d\u6742\u7684\u8bed\u4e49\u68c0\u7d22\u4efb\u52a1\uff0c\u5c24\u5176\u662f\u5728\u5411\u91cf\u7a7a\u95f4\u4e2d\u3002<\/li>\n<li>\u80fd\u591f\u5904\u7406\u5927\u89c4\u6a21\u6570\u636e\u96c6\uff0c\u68c0\u7d22\u901f\u5ea6\u5feb\u3002<\/li>\n<\/ul>\n<\/li>\n<li>\u5c06 BM25Retriever \u548c FAISS \u7ec4\u5408\u5728\u4e00\u8d77\uff1a\n<ul>\n<li>\u4e92\u8865\u6027\uff1aBM25 \u66f4\u9002\u5408\u5904\u7406\u57fa\u4e8e\u5173\u952e\u8bcd\u7684\u68c0\u7d22\uff0c\u80fd\u591f\u6709\u6548\u5730\u4ece\u6587\u672c\u4e2d\u627e\u5230\u76f8\u5173\u6587\u6863\uff1bFAISS \u5219\u64c5\u957f\u5904\u7406\u8bed\u4e49\u76f8\u4f3c\u6027\uff0c\u901a\u8fc7\u5411\u91cf\u5316\u8868\u793a\u6355\u6349\u6587\u672c\u7684\u6df1\u5c42\u542b\u4e49\u3002<\/li>\n<li>\u63d0\u9ad8\u68c0\u7d22\uff1a\u901a\u8fc7\u7ec4\u5408\u4e24\u79cd\u65b9\u6cd5\uff0c\u53ef\u4ee5\u5145\u5206\u5229\u7528 BM25 \u7684\u8bcd\u9891\u7279\u6027\u548c FAISS \u7684\u5411\u91cf\u76f8\u4f3c\u6027\uff0c\u4ece\u800c\u63d0\u9ad8\u6574\u4f53\u68c0\u7d22\u7684\u51c6\u786e\u6027\u548c\u5168\u9762\u6027\u3002<\/li>\n<\/ul>\n<\/li>\n<\/ul>\n<h3><span class=\"ez-toc-section\" id=\"%E9%95%BF%E4%B8%8A%E4%B8%8B%E6%96%87%E9%87%8D%E6%8E%92%E5%BA%8F_LongContextReorder\"><\/span>\u957f\u4e0a\u4e0b\u6587\u91cd\u6392\u5e8f LongContextReorder<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p><strong>\u7b80\u4ecb<\/strong>:<br \/>\nLongContextReorder\u662f\u4e00\u79cd\u7528\u4e8e\u5904\u7406\u957f\u4e0a\u4e0b\u6587\u4fe1\u606f\u7684\u6280\u672f\uff0c\u65e8\u5728\u63d0\u9ad8\u6a21\u578b\u5728\u957f\u6587\u672c\u4e2d\u7684\u4fe1\u606f\u63d0\u53d6\u548c\u7406\u89e3\u80fd\u529b\u3002\u5b83\u901a\u8fc7\u91cd\u65b0\u6392\u5e8f\u6587\u6863\uff0c\u4ee5\u4f7f\u6700\u76f8\u5173\u7684\u4fe1\u606f\u66f4\u6613\u4e8e\u88ab\u6a21\u578b\u6355\u6349\u3002<\/p>\n<p><strong>\u529f\u80fd<\/strong>:<br \/>\n<strong>\u4fe1\u606f\u91cd\u6392\u5e8f<\/strong>: LongContextReorder\u4ece\u591a\u4e2a\u68c0\u7d22\u5668\u4e2d\u83b7\u53d6\u6587\u6863\uff0c\u5e76\u5bf9\u5b83\u4eec\u8fdb\u884c\u91cd\u65b0\u6392\u5e8f\uff0c\u4f7f\u5f97\u6700\u76f8\u5173\u7684\u6587\u6863\u4f4d\u4e8e\u4e0a\u4e0b\u6587\u7a97\u53e3\u7684\u5f00\u5934\u548c\u7ed3\u5c3e\u3002\u8fd9\u6709\u52a9\u4e8e\u6a21\u578b\u66f4\u597d\u5730\u5173\u6ce8\u6574\u4e2a\u4e0a\u4e0b\u6587\u4e2d\u7684\u5173\u952e\u5185\u5bb9\u3002<br \/>\n\u4e0a\u4e0b\u6587\u4f18\u5316: \u901a\u8fc7\u4f18\u5316\u4e0a\u4e0b\u6587\u7684\u6392\u5217\uff0c\u6a21\u578b\u80fd\u591f\u66f4\u6709\u6548\u5730\u5229\u7528\u957f\u6587\u672c\u4e2d\u7684\u4fe1\u606f\uff0c\u4ece\u800c\u63d0\u9ad8\u56de\u7b54\u7684\u51c6\u786e\u6027\u548c\u76f8\u5173\u6027\u3002<\/p>\n<p><strong>\u4f7f\u7528\u573a\u666f<\/strong>:<br \/>\n\u8fd9\u79cd\u6280\u672f\u7279\u522b\u9002\u5408\u9700\u8981\u5728\u957f\u6587\u672c\u4e2d\u63d0\u53d6\u5173\u952e\u4fe1\u606f\u7684\u5e94\u7528\u573a\u666f\uff0c\u6bd4\u5982\u6cd5\u5f8b\u6587\u4e66\u5206\u6790\u3001\u5b66\u672f\u8bba\u6587\u9605\u8bfb\u548c\u957f\u7bc7\u6545\u4e8b\u7406\u89e3\u7b49\u3002<\/p>\n<p><strong>\u4f7f\u7528\u65b9\u6cd5<\/strong>\uff1a<\/p>\n<p><strong>\u7b2c\u4e00\u6b65<\/strong>\uff1a\u542f\u52a8 Chroma \u6570\u636e\u5e93<\/p>\n<pre><code class=\"language-bash\">chroma run --path chroma_test --port 8000<\/code><\/pre>\n<p>\u8bf4\u660e\uff1a<\/p>\n<ul>\n<li>\u6b64\u5904\u662f\u907f\u514d\u4e0e\u524d\u9762\u7684\u4ee3\u7801\u4ea7\u751f\u6570\u636e\u6c61\u67d3\uff0c\u6240\u4ee5\u6700\u597d\u5173\u95ed\u4e4b\u524d\u7684chroma\u6570\u636e\u5e93\uff0c\u91cd\u65b0\u542f\u52a8\u4e00\u4e2a\u65b0\u7684\u3002<\/li>\n<\/ul>\n<p><strong>\u7b2c\u4e8c\u6b65<\/strong>\uff1a\u51c6\u5907\u6570\u636e<\/p>\n<pre><code class=\"language-python\">import os\nfrom langchain.chains import LLMChain, StuffDocumentsChain\nfrom langchain.prompts import PromptTemplate\nfrom langchain_chroma import Chroma\nfrom langchain_community.document_transformers import (\n    LongContextReorder,\n)\nfrom langchain_community.embeddings import HuggingFaceEmbeddings\n\n# \u6d4b\u8bd5\u6570\u636e\ntexts = [\n    &quot;\u7bee\u7403\u662f\u4e00\u9879\u5f88\u68d2\u7684\u8fd0\u52a8\u3002&quot;,\n    &quot;\u300aFly me to the moon\u300b \u662f\u6211\u6700\u559c\u6b22\u7684\u6b4c\u66f2\u4e4b\u4e00\u3002&quot;,\n    &quot;\u51ef\u5c14\u7279\u4eba\u662f\u6211\u6700\u559c\u6b22\u7684\u7403\u961f\u3002&quot;,\n    &quot;\u8fd9\u662f\u5173\u4e8e\u6ce2\u58eb\u987f\u51ef\u5c14\u7279\u4eba\u7684\u4e00\u7bc7\u6587\u7ae0\u3002&quot;,\n    &quot;\u6211\u6700\u559c\u6b22\u7684\u6e38\u620f\u662f\u300a\u9ed1\u795e\u8bdd\uff1a\u609f\u7a7a\u300b&quot;,\n    &quot;\u6ce2\u58eb\u987f\u51ef\u5c14\u7279\u4eba\u4ee520\u5206\u7684\u4f18\u52bf\u8d62\u5f97\u4e86\u6bd4\u8d5b\u3002&quot;,\n    &quot;\u5728\u300a\u897f\u6e38\u8bb0\u300b\u4e2d\uff0c\u5b59\u609f\u7a7a\u4e09\u6253\u767d\u9aa8\u7cbe\u65f6\uff0c\u767d\u9aa8\u7cbe\u5206\u522b\u53d8\u6210\u4e86\u6751\u59d1\u3001\u8001\u5987\u548c\u8001\u7fc1\u8fd9\u4e09\u79cd\u5f62\u6001\u3002&quot;\n    &quot;\u5b59\u609f\u7a7a\u4e09\u5927\u767d\u9aa8\u7cbe\u662f\u897f\u6e38\u8bb0\u4e2d\u4e00\u6bb5\u7cbe\u5f69\u7684\u7bc7\u7ae0\u3002&quot;,\n    &quot;L. Kornet \u662f\u51ef\u5c14\u7279\u4eba\u961f\u4e2d\u6700\u4f18\u79c0\u7684\u7403\u5458\u4e4b\u4e00&quot;,\n    &quot;Larry Bird \u662f\u4e00\u4f4d\u6807\u5fd7\u6027\u7684NBA\u7403\u5458\u3002&quot;,\n]\n# \u521d\u59cb\u5316 HuggingFaceEmbeddings\nembeddings = HuggingFaceEmbeddings(model_name=&quot;bert-base-chinese&quot;)<\/code><\/pre>\n<p><strong>\u7b2c\u4e09\u6b65<\/strong>\uff1a\u521b\u5efaRetriever\u5e76\u67e5\u8be2\u76f8\u5173\u4fe1\u606f<\/p>\n<pre><code class=\"language-python\"># \u521b\u5efa\u4e00\u4e2a retriever\nretriever = Chroma.from_texts(texts, embedding=embeddings).as_retriever(\n    search_kwargs={&quot;k&quot;: 10}\n)\n\nquery = &quot;\u8bf7\u544a\u8bc9\u6211\u5173\u4e8e\u767d\u9aa8\u7cbe\u7684\u4e8b\u60c5&quot;\n\n# Get relevant documents ordered by relevance score\ndocs = retriever.get_relevant_documents(query)\nfor doc in docs:\n    print(doc.page_content)<\/code><\/pre>\n<p>\u8fd0\u884c\u7ed3\u679c\uff1a<\/p>\n<pre><code class=\"language-bash\">\u5728\u300a\u897f\u6e38\u8bb0\u300b\u4e2d\uff0c\u5b59\u609f\u7a7a\u4e09\u6253\u767d\u9aa8\u7cbe\u65f6\uff0c\u767d\u9aa8\u7cbe\u5206\u522b\u53d8\u6210\u4e86\u6751\u59d1\u3001\u8001\u5987\u548c\u8001\u7fc1\u8fd9\u4e09\u79cd\u5f62\u6001\u3002\u5b59\u609f\u7a7a\u4e09\u5927\u767d\u9aa8\u7cbe\u662f\u897f\u6e38\u8bb0\u4e2d\u4e00\u6bb5\u7cbe\u5f69\u7684\u7bc7\u7ae0\u3002\n\u8fd9\u662f\u5173\u4e8e\u6ce2\u58eb\u987f\u51ef\u5c14\u7279\u4eba\u7684\u4e00\u7bc7\u6587\u7ae0\u3002\n\u6211\u6700\u559c\u6b22\u7684\u6e38\u620f\u662f\u300a\u9ed1\u795e\u8bdd\uff1a\u609f\u7a7a\u300b\nL. Kornet \u662f\u51ef\u5c14\u7279\u4eba\u961f\u4e2d\u6700\u4f18\u79c0\u7684\u7403\u5458\u4e4b\u4e00\n\u300aFly me to the moon\u300b \u662f\u6211\u6700\u559c\u6b22\u7684\u6b4c\u66f2\u4e4b\u4e00\u3002\n\u51ef\u5c14\u7279\u4eba\u662f\u6211\u6700\u559c\u6b22\u7684\u7403\u961f\u3002\nLarry Bird \u662f\u4e00\u4f4d\u6807\u5fd7\u6027\u7684NBA\u7403\u5458\u3002\n\u7bee\u7403\u662f\u4e00\u9879\u5f88\u68d2\u7684\u8fd0\u52a8\u3002\n\u6ce2\u58eb\u987f\u51ef\u5c14\u7279\u4eba\u4ee520\u5206\u7684\u4f18\u52bf\u8d62\u5f97\u4e86\u6bd4\u8d5b\u3002<\/code><\/pre>\n<p><strong>\u7b2c\u56db\u6b65<\/strong>\uff1a\u4f7f\u7528LongContextReorder\u8fdb\u884c\u91cd\u6392\u5e8f<\/p>\n<pre><code class=\"language-python\">reordering = LongContextReorder()\nreordered_docs = reordering.transform_documents(docs)\n\nfor doc in reordered_docs:\n    print(doc.page_content)<\/code><\/pre>\n<p>\u8fd0\u884c\u7ed3\u679c\uff1a<\/p>\n<pre><code class=\"language-bash\">\u5728\u300a\u897f\u6e38\u8bb0\u300b\u4e2d\uff0c\u5b59\u609f\u7a7a\u4e09\u6253\u767d\u9aa8\u7cbe\u65f6\uff0c\u767d\u9aa8\u7cbe\u5206\u522b\u53d8\u6210\u4e86\u6751\u59d1\u3001\u8001\u5987\u548c\u8001\u7fc1\u8fd9\u4e09\u79cd\u5f62\u6001\u3002\u5b59\u609f\u7a7a\u4e09\u5927\u767d\u9aa8\u7cbe\u662f\u897f\u6e38\u8bb0\u4e2d\u4e00\u6bb5\u7cbe\u5f69\u7684\u7bc7\u7ae0\u3002\n\u6211\u6700\u559c\u6b22\u7684\u6e38\u620f\u662f\u300a\u9ed1\u795e\u8bdd\uff1a\u609f\u7a7a\u300b\n\u300aFly me to the moon\u300b \u662f\u6211\u6700\u559c\u6b22\u7684\u6b4c\u66f2\u4e4b\u4e00\u3002\nLarry Bird \u662f\u4e00\u4f4d\u6807\u5fd7\u6027\u7684NBA\u7403\u5458\u3002\n\u6ce2\u58eb\u987f\u51ef\u5c14\u7279\u4eba\u4ee520\u5206\u7684\u4f18\u52bf\u8d62\u5f97\u4e86\u6bd4\u8d5b\u3002\n\u7bee\u7403\u662f\u4e00\u9879\u5f88\u68d2\u7684\u8fd0\u52a8\u3002\n\u51ef\u5c14\u7279\u4eba\u662f\u6211\u6700\u559c\u6b22\u7684\u7403\u961f\u3002\nL. Kornet \u662f\u51ef\u5c14\u7279\u4eba\u961f\u4e2d\u6700\u4f18\u79c0\u7684\u7403\u5458\u4e4b\u4e00\n\u8fd9\u662f\u5173\u4e8e\u6ce2\u58eb\u987f\u51ef\u5c14\u7279\u4eba\u7684\u4e00\u7bc7\u6587\u7ae0\u3002<\/code><\/pre>\n<p>\u5bf9\u6bd4\u4e0a\u9762\u7684\u7ed3\u679c\uff0c\u53ef\u4ee5\u770b\u5230\uff0c\u901a\u8fc7\u4f7f\u7528 LongContextReorder\uff0c\u53ef\u4ee5\u5c06\u6587\u6863\u91cd\u65b0\u6392\u5e8f\uff0c\u5c06\u4e0e\u897f\u6e38\u76f8\u5173\u7684\u4fe1\u606f\u6392\u5728\u524d\u9762\uff0c\u6709\u52a9\u4e8e\u63d0\u9ad8\u6a21\u578b\u7684\u7406\u89e3\u80fd\u529b\u3002<\/p>\n<h3><span class=\"ez-toc-section\" id=\"ElasticSearchBM25Retriever\"><\/span>ElasticSearchBM25Retriever<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p><strong>\u7b80\u4ecb<\/strong>:<br \/>\nElasticSearchBM25Retriever\u4f7f\u7528BM25\u7b97\u6cd5\uff0c\u8fd9\u662f\u4fe1\u606f\u68c0\u7d22\u4e2d\u7684\u4e00\u79cd\u7ecf\u5178\u65b9\u6cd5\uff0c\u5e7f\u6cdb\u5e94\u7528\u4e8eElasticSearch\u7b49\u641c\u7d22\u5f15\u64ce\u4e2d\u3002<\/p>\n<p><strong>\u529f\u80fd<\/strong>:<br \/>\nBM25\u662f\u4e00\u79cd\u57fa\u4e8e\u6982\u7387\u6a21\u578b\u7684\u68c0\u7d22\u7b97\u6cd5\uff0c\u80fd\u591f\u6839\u636e\u6587\u6863\u548c\u67e5\u8be2\u4e4b\u95f4\u7684\u8bcd\u9891\u548c\u9006\u6587\u6863\u9891\u7387\uff0c\u8ba1\u7b97\u6587\u6863\u7684\u76f8\u5173\u6027\u5f97\u5206\u3002<\/p>\n<p><strong>\u4f7f\u7528\u573a\u666f<\/strong>:<br \/>\nElasticSearchBM25Retriever\u9002\u7528\u4e8e\u9700\u8981\u9ad8\u6548\u6587\u672c\u641c\u7d22\u7684\u573a\u666f\uff0c\u5c24\u5176\u662f\u5728\u9700\u8981\u5904\u7406\u5927\u91cf\u975e\u7ed3\u6784\u5316\u6587\u672c\u6570\u636e\u65f6\u3002\u5b83\u5728\u641c\u7d22\u5f15\u64ce\u4f18\u5316\u548c\u6587\u672c\u6316\u6398\u4e2d\u975e\u5e38\u6709\u7528\u3002<\/p>\n<p><strong>\u4f7f\u7528\u65b9\u6cd5<\/strong>\uff1a<\/p>\n<p><strong>\u7b2c\u4e00\u6b65<\/strong>\uff1a\u5b89\u88c5\u5fc5\u8981\u7684\u5e93<\/p>\n<pre><code class=\"language-bash\">pip install elasticsearch langchain<\/code><\/pre>\n<p><strong>\u7b2c\u4e8c\u6b65<\/strong>\uff1a\u5b89\u88c5Elasticsearch\u5e76\u542f\u52a8\u670d\u52a1<\/p>\n<ol>\n<li>\u542f\u52a8Elasticsearch\u7684Docker\u5bb9\u5668\uff0c\u786e\u4fdd Elasticsearch \u670d\u52a1\u6b63\u5728\u8fd0\u884c\u3002<\/li>\n<li>\u5728\u6d4f\u89c8\u5668\u4e2d\u8bbf\u95ee <a href=\"http:\/\/localhost:9200\">http:\/\/localhost:9200<\/a> \u53ef\u4ee5\u5f97\u5230\u5982\u4e0b\u5185\u5bb9\u3002<br \/>\n<a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/es\u670d\u52a1\u5df2\u7ecf\u542f\u52a8.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/es\u670d\u52a1\u5df2\u7ecf\u542f\u52a8.png\" alt=\"\" \/><\/a><\/li>\n<\/ol>\n<blockquote>\n<p>\u8bf4\u660e\uff1aElasticsearch \u7684\u5b89\u88c5\u65b9\u6cd5\u8f83\u957f\uff0c\u7531\u4e8e\u4e0d\u662f\u672c\u7ae0\u7684\u4e3b\u7ebf\u5185\u5bb9\uff0c\u6240\u4ee5\u6211\u5c06\u8fd9\u65b9\u9762\u5185\u5bb9\u653e\u5728\u9644\u5f55\u90e8\u5206\u3002<\/p>\n<\/blockquote>\n<p><strong>\u7b2c\u4e09\u6b65<\/strong>\uff1a\u51c6\u5907\u6570\u636e\u5e76\u521b\u5efa\u7d22\u5f15<\/p>\n<pre><code class=\"language-python\">from elasticsearch import Elasticsearch\nfrom langchain.retrievers import ElasticSearchBM25Retriever\n\nelasticsearch_url = &quot;http:\/\/elastic:mytest@localhost:9200&quot;\n\n# \u521b\u5efa\u68c0\u7d22\u5668\nretriever = ElasticSearchBM25Retriever.create(elasticsearch_url, &quot;langchain-index-5&quot;)\n\n# \u51c6\u5907\u6d4b\u8bd5\u6570\u636e\ndocuments = [\n    &quot;\u7bee\u7403\u662f\u4e00\u9879\u5f88\u68d2\u7684\u8fd0\u52a8\u3002&quot;,\n    &quot;\u300aFly me to the moon\u300b \u662f\u6211\u6700\u559c\u6b22\u7684\u6b4c\u66f2\u4e4b\u4e00\u3002&quot;,\n    &quot;\u51ef\u5c14\u7279\u4eba\u662f\u6211\u6700\u559c\u6b22\u7684\u7403\u961f\u3002&quot;,\n    &quot;\u8fd9\u662f\u5173\u4e8e\u6ce2\u58eb\u987f\u51ef\u5c14\u7279\u4eba\u7684\u4e00\u7bc7\u6587\u7ae0\u3002&quot;,\n    &quot;\u6211\u6700\u559c\u6b22\u7684\u6e38\u620f\u662f\u300a\u9ed1\u795e\u8bdd\uff1a\u609f\u7a7a\u300b&quot;\n]\n\n# \u6dfb\u52a0\u6587\u672c\nretriever.add_texts(documents)<\/code><\/pre>\n<p>\u8fd0\u884c\u7ed3\u679c\uff1a<\/p>\n<pre><code class=\"language-bash\">[&#039;39c92ff7-4aba-42fb-bc88-2997b5e0c297&#039;,\n &#039;b1e9c357-b67c-43e0-bf95-2591c9e2a103&#039;,\n &#039;e4f964cf-92a0-4b4a-b648-9d0c2f8594b0&#039;,\n &#039;9edcfd38-e954-4bb1-b0d5-68ebf13b3443&#039;,\n &#039;ea0fc62f-6afd-4e27-9f85-a357ef9221a3&#039;]<\/code><\/pre>\n<p>\u8bf4\u660e\uff1a<br \/>\n<code>http:\/\/elastic:mytest@localhost:9200<\/code> \u4e2d\uff1a<\/p>\n<ul>\n<li><code>elastic<\/code> \u662f\u7528\u6237\u540d<\/li>\n<li><code>mytest<\/code> \u662f\u5bc6\u7801<\/li>\n<\/ul>\n<p>\u7b2c\u56db\u6b65\uff1a\u4f7f\u7528 <code>retriever<\/code> \u8fdb\u884c\u67e5\u8be2<\/p>\n<pre><code class=\"language-python\">\n# \u67e5\u8be2\nquery = &quot;\u8bf7\u544a\u8bc9\u6211\u5173\u4e8e\u51ef\u5c14\u7279\u4eba\u7684\u4e8b\u60c5&quot;\ntry:\n    docs = retriever.get_relevant_documents(query)\n\n    # \u8f93\u51fa\u7ed3\u679c\n    for doc in docs:\n        print(doc.page_content)\n        print(&quot;-&quot; * 20)\nexcept Exception as e:\n    print(f&quot;An error occurred: {e}&quot;)<\/code><\/pre>\n<p>\u8fd0\u884c\u7ed3\u679c\uff1a<\/p>\n<pre><code class=\"language-bash\">\u8fd9\u662f\u5173\u4e8e\u6ce2\u58eb\u987f\u51ef\u5c14\u7279\u4eba\u7684\u4e00\u7bc7\u6587\u7ae0\u3002\n--------------------\n\u51ef\u5c14\u7279\u4eba\u662f\u6211\u6700\u559c\u6b22\u7684\u7403\u961f\u3002\n--------------------\n\u6211\u6700\u559c\u6b22\u7684\u6e38\u620f\u662f\u300a\u9ed1\u795e\u8bdd\uff1a\u609f\u7a7a\u300b\n--------------------\n\u300aFly me to the moon\u300b \u662f\u6211\u6700\u559c\u6b22\u7684\u6b4c\u66f2\u4e4b\u4e00\u3002\n--------------------\n\u7bee\u7403\u662f\u4e00\u9879\u5f88\u68d2\u7684\u8fd0\u52a8\u3002\n--------------------<\/code><\/pre>\n<h2><span class=\"ez-toc-section\" id=\"%E8%87%AA%E5%AE%9A%E4%B9%89%E4%B8%80%E4%B8%AAretriever\"><\/span>\u81ea\u5b9a\u4e49\u4e00\u4e2aretriever<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p>(\u5f85\u8865\u5145)<\/p>\n<h2><span class=\"ez-toc-section\" id=\"%E9%99%84%E5%BD%95\"><\/span>\u9644\u5f55<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<h3><span class=\"ez-toc-section\" id=\"ElasticSearch%E7%9A%84Docker%E5%AE%89%E8%A3%85%E6%95%99%E7%A8%8B\"><\/span>ElasticSearch\u7684Docker\u5b89\u88c5\u6559\u7a0b<span class=\"ez-toc-section-end\"><\/span><\/h3>\n<p>\u7531\u4e8e\u5728\u7cfb\u7edf\u73af\u5883\u4e2d\u5b89\u88c5ElasticSearch\u975e\u5e38\u7e41\u7410\uff0c\u9700\u8981\u5b89\u88c5(JDK\u7b49)\u57fa\u7840\u73af\u5883\uff0c\u6240\u4ee5\u6211\u4eec\u4f7f\u7528Docker\u6765\u5b89\u88c5ElasticSearch\u3002<\/p>\n<h4><span class=\"ez-toc-section\" id=\"%E5%AE%89%E8%A3%85Docker\"><\/span>\u5b89\u88c5Docker<span class=\"ez-toc-section-end\"><\/span><\/h4>\n<p>Docker\u7684\u5b89\u88c5\u6559\u7a0b\u6bd4\u8f83\u591a\u4e14\u8be6\u7ec6\uff0c\u6240\u4ee5\u672c\u6587\u4e0d\u518d\u8d58\u8ff0\uff0c\u8be6\u60c5\u8bf7\u67e5\u770b\uff1a<br \/>\n<a href=\"https:\/\/blog.csdn.net\/yohnyang\/article\/details\/138435593\">10\u5206\u949f\u5b66\u4f1aDocker\u7684\u5b89\u88c5\u548c\u4f7f\u7528<\/a><\/p>\n<h4><span class=\"ez-toc-section\" id=\"%E5%88%9B%E5%BB%BA%E7%BD%91%E7%BB%9C\"><\/span>\u521b\u5efa\u7f51\u7edc<span class=\"ez-toc-section-end\"><\/span><\/h4>\n<pre><code class=\"language-python\">docker network create es-net<\/code><\/pre>\n<p>\u8fd0\u884c\u7ed3\u679c\uff1a<br \/>\n<a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u521b\u5efa\u7f51\u7edc.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u521b\u5efa\u7f51\u7edc.png\" alt=\"\" \/><\/a><\/p>\n<h4><span class=\"ez-toc-section\" id=\"%E6%8B%89%E5%8F%96%E9%95%9C%E5%83%8F\"><\/span>\u62c9\u53d6\u955c\u50cf<span class=\"ez-toc-section-end\"><\/span><\/h4>\n<pre><code class=\"language-bash\">docker pull elasticsearch:8.6.0<\/code><\/pre>\n<p>\u8fd0\u884c\u7ed3\u679c\uff1a<br \/>\n<a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u62c9\u53d6\u955c\u50cf.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u62c9\u53d6\u955c\u50cf.png\" alt=\"\" \/><\/a><\/p>\n<h4><span class=\"ez-toc-section\" id=\"%E5%88%9B%E5%BB%BA%E6%8C%82%E8%BD%BD%E7%82%B9%E7%9B%AE%E5%BD%95\"><\/span>\u521b\u5efa\u6302\u8f7d\u70b9\u76ee\u5f55<span class=\"ez-toc-section-end\"><\/span><\/h4>\n<pre><code class=\"language-bash\"># \u9009\u62e9\u5408\u9002\u7684\u76ee\u5f55\u521b\u5efa\u4e09\u4e2a\u6587\u4ef6\u5939\nmkdir -p \/Users\/deadwalk\/Code\/elasticsearch\/data \/Users\/deadwalk\/Code\/elasticsearch\/config \/Users\/deadwalk\/Code\/elasticsearch\/plugins<\/code><\/pre>\n<p>\u8fd0\u884c\u7ed3\u679c\uff1a<br \/>\n<a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u521b\u5efa\u6587\u4ef6\u5939.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u521b\u5efa\u6587\u4ef6\u5939.png\" alt=\"\" \/><\/a><\/p>\n<h4><span class=\"ez-toc-section\" id=\"%E5%90%AF%E5%8A%A8%E5%AE%B9%E5%99%A8\"><\/span>\u542f\u52a8\u5bb9\u5668<span class=\"ez-toc-section-end\"><\/span><\/h4>\n<p>\u547d\u4ee4\u884c\u4e2d\u8f93\u5165\u547d\u4ee4\u542f\u52a8Docker\u5bb9\u5668<\/p>\n<pre><code class=\"language-bash\">docker run -d \\\n--restart=always \\\n--name es \\\n--network es-net \\\n-p 9200:9200 \\\n-p 9300:9300 \\\n--privileged \\\n-v \/Users\/deadwalk\/Code\/elasticsearch\/data:\/usr\/share\/elasticsearch\/data \\\n-v \/Users\/deadwalk\/Code\/elasticsearch\/plugins:\/usr\/share\/elasticsearch\/plugins \\\n-e &quot;discovery.type=single-node&quot; \\\n-e &quot;ES_JAVA_OPTS=-Xms512m -Xmx512m&quot; \\\nelasticsearch:8.6.0\n<\/code><\/pre>\n<p>\u8fd0\u884c\u7ed3\u679c\uff1a<br \/>\n<a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u542f\u52a8Docker.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u542f\u52a8Docker.png\" alt=\"\" \/><\/a><\/p>\n<p>\u4f7f\u7528 <code>docker ps<\/code> \u53ef\u4ee5\u770b\u5230Docker\u5bb9\u5668\u5df2\u7ecf\u542f\u52a8\u3002<br \/>\n<a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/PS\u547d\u4ee4\u67e5\u770b.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/PS\u547d\u4ee4\u67e5\u770b.png\" alt=\"\" \/><\/a><\/p>\n<h4><span class=\"ez-toc-section\" id=\"%E4%BF%AE%E6%94%B9elasticsearch%E7%9A%84%E5%AF%86%E7%A0%81\"><\/span>\u4fee\u6539elasticsearch\u7684\u5bc6\u7801<span class=\"ez-toc-section-end\"><\/span><\/h4>\n<p>\u7b2c\u4e00\u6b65\uff1a\u8fdb\u5165es\u5bb9\u5668<\/p>\n<pre><code class=\"language-bash\">docker exec -it es \/bin\/bash<\/code><\/pre>\n<p>\u7b2c\u4e8c\u6b65\uff1a\u547d\u4ee4\u884c\u8f93\u5165\u91cd\u7f6e\u5bc6\u7801\u547d\u4ee4<\/p>\n<pre><code class=\"language-bash\">bin\/elasticsearch-reset-password -i -u elastic<\/code><\/pre>\n<p>\u6839\u636e\u63d0\u793a\u91cd\u7f6e\u5bc6\u7801\uff0c\u4f8b\u5982\uff1amytest<\/p>\n<p>\u7b2c\u4e09\u6b65\uff1a\u4f7f\u7528\u6d4f\u89c8\u5668\u8bbf\u95eehttp:\/\/localhost:9200\/<br \/>\n\u4f7f\u7528\u7528\u6237\u540d <code>elastic<\/code> \u548c\u91cd\u7f6e\u7684\u5bc6\u7801 <code>mytest<\/code> \uff0c\u9a8c\u8bc1\u53ef\u4ee5\u767b\u5f55\u3002<br \/>\n<a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u9a8c\u8bc1elastic.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u9a8c\u8bc1elastic.png\" alt=\"\" \/><\/a><\/p>\n<h2><span class=\"ez-toc-section\" id=\"%E5%86%85%E5%AE%B9%E5%B0%8F%E7%BB%93\"><\/span>\u5185\u5bb9\u5c0f\u7ed3<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<ul>\n<li>RAG\u7cfb\u7edf\u5728\u8fdb\u884cLoad-&gt;Split-&gt;Embedding-&gt;Store-&gt;Query\u6d41\u7a0b\u65f6\uff0c\u9700\u8981\u4f7f\u7528 <code>Retriever<\/code> \u8fdb\u884c\u6587\u6863\u68c0\u7d22\u3002<\/li>\n<li>Retriever\u8fdb\u884c\u6587\u6863\u68c0\u7d22\u65f6\uff0c\u6709\u4e24\u79cd\u65b9\u6cd5\u6784\u5efaChain\u94fe:\u4e00\u79cd\u662f\u4f20\u7edf\u7684\u7ba1\u9053\u7b26\u6784\u5efa\uff0c\u53e6\u4e00\u79cd\u662f\u4f7f\u7528 <code>create_retrieval_chain<\/code> \u3002<\/li>\n<li>\u4f7f\u7528Retriever\u65f6\uff0c\u9664\u4e86\u57fa\u7840\u7684\u5411\u91cf\u5b58\u50a8\u68c0\u7d22\u5668\u4e4b\u5916\uff0c\u8fd8\u53ef\u4ee5\u4f7f\u7528\u591a\u67e5\u8be2\u68c0\u7d22\u5668\uff08<code>MultiQueryRetriever<\/code>\uff09\u3001\u7ed3\u5408\u68c0\u7d22\u5668\uff08<code>EnsembleRetriever<\/code>\uff09\u7b49\u3002<\/li>\n<li><code>MultiQueryRetriever<\/code> \u662f\u4e00\u79cd\u68c0\u7d22\u7b97\u6cd5\uff0c\u5b83\u901a\u8fc7\u4f7f\u7528\u5927\u578b\u8bed\u8a00\u6a21\u578b(LLM)\u751f\u6210\u591a\u4e2a\u67e5\u8be2\uff0c\u4ece\u800c\u81ea\u52a8\u5316\u63d0\u793a\u8c03\u4f18\u8fc7\u7a0b\u3002<\/li>\n<li><code>MultiQueryRetriever<\/code> \u7684\u5de5\u4f5c\u6d41\u7a0b\u5982\u4e0b\uff1a\n<ul>\n<li>1\u3001 <code>MultiQueryRetriever<\/code> \u4f1a\u501f\u52a9\u5927\u6a21\u578b\u751f\u6210\u65b0\u7684\u591a\u4e2a\u67e5\u8be2 <code>queries\uff1b<\/code><\/li>\n<li>2\u3001 <code>MultiQueryRetriever<\/code> \u4f1a\u901a\u8fc7\u8fd9\u4e9b <code>queries<\/code> \u68c0\u7d22\u51fa\u76f8\u5173\u7684\u6587\u6863\uff1b<\/li>\n<li>3\u3001\u6700\u540e\uff0c\u901a\u8fc7 <code>combine_docs_chain<\/code> \u5c06\u68c0\u7d22\u51fa\u7684\u6587\u6863\u4ea4\u7ed9\u5927\u6a21\u578b\u5f97\u5230\u6700\u7ec8\u7b54\u6848\u3002<\/li>\n<\/ul>\n<\/li>\n<li><code>EnsembleRetriever<\/code> \u662f\u4e00\u79cd\u7ed3\u5408\u591a\u4e2a\u68c0\u7d22\u5668\u7ed3\u679c\u7684\u7b97\u6cd5\uff0c\u901a\u8fc7\u91cd\u65b0\u6392\u5e8f\u6765\u63d0\u9ad8\u68c0\u7d22\u6548\u679c\u3002\n<ul>\n<li><code>BM25Retriever<\/code> \u662f\u4e00\u79cd\u57fa\u4e8e\u7ecf\u5178\u4fe1\u606f\u68c0\u7d22\u6a21\u578b BM25 \u7684\u68c0\u7d22\u5668\u3002<\/li>\n<li><code>FAISS\uff08Facebook AI Similarity Search\uff09<\/code> \u662f\u4e00\u4e2a\u9ad8\u6548\u7684\u76f8\u4f3c\u6027\u641c\u7d22\u5e93\uff0c\u4e13\u95e8\u7528\u4e8e\u5904\u7406\u5927\u89c4\u6a21\u5411\u91cf\u6570\u636e\u3002<\/li>\n<li><code>EnsembleRetriever<\/code> \u53ef\u4ee5\u5c06 <code>BM25Retriever<\/code> \u548c <code>FAISS<\/code> \u7ec4\u5408\u4f7f\u7528\uff0c\u4ece\u800c\u63d0\u9ad8\u6574\u4f53\u68c0\u7d22\u7684\u51c6\u786e\u6027\u548c\u5168\u9762\u6027\u3002<\/li>\n<\/ul>\n<\/li>\n<li><code>LongContextReorder<\/code> \u662f\u4e00\u79cd\u7528\u4e8e\u5904\u7406\u957f\u4e0a\u4e0b\u6587\u4fe1\u606f\u7684\u6280\u672f\uff0c\u65e8\u5728\u63d0\u9ad8\u6a21\u578b\u5728\u957f\u6587\u672c\u4e2d\u7684\u4fe1\u606f\u63d0\u53d6\u548c\u7406\u89e3\u80fd\u529b\u3002<\/li>\n<li><code>ElasticSearchBM25Retriever<\/code> \u53ef\u4ee5\u4e0e\u5f00\u6e90\u641c\u7d22\u5f15\u64ce <code>ElasticSearch<\/code> \u8fdb\u884c\u4ea4\u4e92\uff0c\u4ee5\u5b9e\u73b0\u5411\u91cf\u641c\u7d22\u3002 <\/li>\n<\/ul>\n<h2><span class=\"ez-toc-section\" id=\"%E5%8F%82%E8%80%83%E8%B5%84%E6%96%99\"><\/span>\u53c2\u8003\u8d44\u6599<span class=\"ez-toc-section-end\"><\/span><\/h2>\n<p><a href=\"https:\/\/blog.csdn.net\/HRG520JN\/article\/details\/137857134\">LangChain\u6559\u7a0b | Retrival\u4e4bRetrievers\u8be6\u89e3 | \u68c0\u7d22\u5668\u6559\u7a0b<\/a><\/p>\n<p align=\"center\">\u6b22\u8fce\u5173\u6ce8\u516c\u4f17\u53f7\u4ee5\u83b7\u5f97\u6700\u65b0\u7684\u6587\u7ae0\u548c\u65b0\u95fb<\/p>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/09\/\u626b\u7801_\u641c\u7d22\u8054\u5408\u4f20\u64ad\u6837\u5f0f-\u767d\u8272\u7248.bmp\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/09\/\u626b\u7801_\u641c\u7d22\u8054\u5408\u4f20\u64ad\u6837\u5f0f-\u767d\u8272\u7248.bmp\" alt=\"\" \/><\/a><\/p>\n","protected":false},"excerpt":{"rendered":"<p>\u524d\u8a00 \u5728\u4e0a\u4e00\u7ae0\u3010\u8bfe\u7a0b\u603b\u7ed3\u3011day28\uff1a\u5927 [&hellip;]<\/p>\n","protected":false},"author":1,"featured_media":20573,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"aside","meta":{"site-sidebar-layout":"default","site-content-layout":"","ast-site-content-layout":"default","site-content-style":"default","site-sidebar-style":"default","ast-global-header-display":"","ast-banner-title-visibility":"","ast-main-header-display":"","ast-hfb-above-header-display":"","ast-hfb-below-header-display":"","ast-hfb-mobile-header-display":"","site-post-title":"","ast-breadcrumbs-content":"","ast-featured-img":"","footer-sml-layout":"","theme-transparent-header-meta":"default","adv-header-id-meta":"","stick-header-meta":"default","header-above-stick-meta":"","header-main-stick-meta":"","header-below-stick-meta":"","astra-migrate-meta-layouts":"set","ast-page-background-enabled":"default","ast-page-background-meta":{"desktop":{"background-color":"var(--ast-global-color-4)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"tablet":{"background-color":"","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"mobile":{"background-color":"","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""}},"ast-content-background-meta":{"desktop":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"tablet":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"mobile":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""}},"footnotes":""},"categories":[28],"tags":[71,68],"class_list":["post-20566","post","type-post","status-publish","format-aside","has-post-thumbnail","hentry","category-blog","tag-rag","tag-68","post_format-post-format-aside"],"yoast_head":"<!-- This site is optimized with the Yoast SEO plugin v26.4 - https:\/\/yoast.com\/wordpress\/plugins\/seo\/ -->\n<title>\u3010\u8bfe\u7a0b\u603b\u7ed3\u3011day29\uff1a\u5927\u6a21\u578b\u4e4b\u6df1\u5165\u4e86\u89e3Retrievers\u89e3\u6790\u5668 - \u4e00\u8d77AI\u6280\u672f<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/17aitech.com\/?p=20566\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"WebPage\",\"@id\":\"https:\/\/17aitech.com\/?p=20566\",\"url\":\"https:\/\/17aitech.com\/?p=20566\",\"name\":\"\u3010\u8bfe\u7a0b\u603b\u7ed3\u3011day29\uff1a\u5927\u6a21\u578b\u4e4b\u6df1\u5165\u4e86\u89e3Retrievers\u89e3\u6790\u5668 - \u4e00\u8d77AI\u6280\u672f\",\"isPartOf\":{\"@id\":\"https:\/\/17aitech.com\/#website\"},\"primaryImageOfPage\":{\"@id\":\"https:\/\/17aitech.com\/?p=20566#primaryimage\"},\"image\":{\"@id\":\"https:\/\/17aitech.com\/?p=20566#primaryimage\"},\"thumbnailUrl\":\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u5c01\u9762-4.jpeg\",\"datePublished\":\"2024-08-29T08:10:07+00:00\",\"dateModified\":\"2024-10-08T07:08:19+00:00\",\"author\":{\"@id\":\"https:\/\/17aitech.com\/#\/schema\/person\/3d23bb6f7f115fcefc9ae7803a691739\"},\"breadcrumb\":{\"@id\":\"https:\/\/17aitech.com\/?p=20566#breadcrumb\"},\"inLanguage\":\"zh-Hans\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\/\/17aitech.com\/?p=20566\"]}]},{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"https:\/\/17aitech.com\/?p=20566#primaryimage\",\"url\":\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u5c01\u9762-4.jpeg\",\"contentUrl\":\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u5c01\u9762-4.jpeg\",\"width\":683,\"height\":393},{\"@type\":\"BreadcrumbList\",\"@id\":\"https:\/\/17aitech.com\/?p=20566#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"\u9996\u9875\",\"item\":\"https:\/\/17aitech.com\/\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"\u3010\u8bfe\u7a0b\u603b\u7ed3\u3011day29\uff1a\u5927\u6a21\u578b\u4e4b\u6df1\u5165\u4e86\u89e3Retrievers\u89e3\u6790\u5668\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/17aitech.com\/#website\",\"url\":\"https:\/\/17aitech.com\/\",\"name\":\"\u4e00\u8d77AI\u6280\u672f\",\"description\":\"\u8ba9AI\u77e5\u8bc6\u89e6\u624b\u53ef\u53ca\",\"alternateName\":\"\u4e00\u8d77AI\u6280\u672f\",\"potentialAction\":[{\"@type\":\"SearchAction\",\"target\":{\"@type\":\"EntryPoint\",\"urlTemplate\":\"https:\/\/17aitech.com\/?s={search_term_string}\"},\"query-input\":{\"@type\":\"PropertyValueSpecification\",\"valueRequired\":true,\"valueName\":\"search_term_string\"}}],\"inLanguage\":\"zh-Hans\"},{\"@type\":\"Person\",\"@id\":\"https:\/\/17aitech.com\/#\/schema\/person\/3d23bb6f7f115fcefc9ae7803a691739\",\"name\":\"Dongming\",\"image\":{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"https:\/\/17aitech.com\/#\/schema\/person\/image\/\",\"url\":\"\/\/17aitech.com\/wp-content\/uploads\/member\/avatars\/238a0b923820dcc5.1732798681.jpg\",\"contentUrl\":\"\/\/17aitech.com\/wp-content\/uploads\/member\/avatars\/238a0b923820dcc5.1732798681.jpg\",\"caption\":\"Dongming\"},\"description\":\"\u89c1\u5929\u5730\uff0c\u89c1\u4f17\u751f\uff0c\u89c1\u81ea\u5df1\u3002\",\"sameAs\":[\"http:\/\/17aitech.com\"],\"url\":\"https:\/\/17aitech.com\/?page_id=33738&user=1\"}]}<\/script>\n<!-- \/ Yoast SEO plugin. -->","yoast_head_json":{"title":"\u3010\u8bfe\u7a0b\u603b\u7ed3\u3011day29\uff1a\u5927\u6a21\u578b\u4e4b\u6df1\u5165\u4e86\u89e3Retrievers\u89e3\u6790\u5668 - \u4e00\u8d77AI\u6280\u672f","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/17aitech.com\/?p=20566","schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"WebPage","@id":"https:\/\/17aitech.com\/?p=20566","url":"https:\/\/17aitech.com\/?p=20566","name":"\u3010\u8bfe\u7a0b\u603b\u7ed3\u3011day29\uff1a\u5927\u6a21\u578b\u4e4b\u6df1\u5165\u4e86\u89e3Retrievers\u89e3\u6790\u5668 - \u4e00\u8d77AI\u6280\u672f","isPartOf":{"@id":"https:\/\/17aitech.com\/#website"},"primaryImageOfPage":{"@id":"https:\/\/17aitech.com\/?p=20566#primaryimage"},"image":{"@id":"https:\/\/17aitech.com\/?p=20566#primaryimage"},"thumbnailUrl":"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u5c01\u9762-4.jpeg","datePublished":"2024-08-29T08:10:07+00:00","dateModified":"2024-10-08T07:08:19+00:00","author":{"@id":"https:\/\/17aitech.com\/#\/schema\/person\/3d23bb6f7f115fcefc9ae7803a691739"},"breadcrumb":{"@id":"https:\/\/17aitech.com\/?p=20566#breadcrumb"},"inLanguage":"zh-Hans","potentialAction":[{"@type":"ReadAction","target":["https:\/\/17aitech.com\/?p=20566"]}]},{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"https:\/\/17aitech.com\/?p=20566#primaryimage","url":"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u5c01\u9762-4.jpeg","contentUrl":"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/\u5c01\u9762-4.jpeg","width":683,"height":393},{"@type":"BreadcrumbList","@id":"https:\/\/17aitech.com\/?p=20566#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"\u9996\u9875","item":"https:\/\/17aitech.com\/"},{"@type":"ListItem","position":2,"name":"\u3010\u8bfe\u7a0b\u603b\u7ed3\u3011day29\uff1a\u5927\u6a21\u578b\u4e4b\u6df1\u5165\u4e86\u89e3Retrievers\u89e3\u6790\u5668"}]},{"@type":"WebSite","@id":"https:\/\/17aitech.com\/#website","url":"https:\/\/17aitech.com\/","name":"\u4e00\u8d77AI\u6280\u672f","description":"\u8ba9AI\u77e5\u8bc6\u89e6\u624b\u53ef\u53ca","alternateName":"\u4e00\u8d77AI\u6280\u672f","potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/17aitech.com\/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"zh-Hans"},{"@type":"Person","@id":"https:\/\/17aitech.com\/#\/schema\/person\/3d23bb6f7f115fcefc9ae7803a691739","name":"Dongming","image":{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"https:\/\/17aitech.com\/#\/schema\/person\/image\/","url":"\/\/17aitech.com\/wp-content\/uploads\/member\/avatars\/238a0b923820dcc5.1732798681.jpg","contentUrl":"\/\/17aitech.com\/wp-content\/uploads\/member\/avatars\/238a0b923820dcc5.1732798681.jpg","caption":"Dongming"},"description":"\u89c1\u5929\u5730\uff0c\u89c1\u4f17\u751f\uff0c\u89c1\u81ea\u5df1\u3002","sameAs":["http:\/\/17aitech.com"],"url":"https:\/\/17aitech.com\/?page_id=33738&user=1"}]}},"_links":{"self":[{"href":"https:\/\/17aitech.com\/index.php?rest_route=\/wp\/v2\/posts\/20566","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/17aitech.com\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/17aitech.com\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/17aitech.com\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/17aitech.com\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=20566"}],"version-history":[{"count":10,"href":"https:\/\/17aitech.com\/index.php?rest_route=\/wp\/v2\/posts\/20566\/revisions"}],"predecessor-version":[{"id":33215,"href":"https:\/\/17aitech.com\/index.php?rest_route=\/wp\/v2\/posts\/20566\/revisions\/33215"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/17aitech.com\/index.php?rest_route=\/wp\/v2\/media\/20573"}],"wp:attachment":[{"href":"https:\/\/17aitech.com\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=20566"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/17aitech.com\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=20566"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/17aitech.com\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=20566"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}