{"id":12167,"date":"2024-07-07T20:00:00","date_gmt":"2024-07-07T12:00:00","guid":{"rendered":"https:\/\/ihower.tw\/blog\/?p=12167"},"modified":"2025-09-20T15:43:08","modified_gmt":"2025-09-20T07:43:08","slug":"embedding-models","status":"publish","type":"post","link":"https:\/\/ihower.tw\/blog\/12167-embedding-models","title":{"rendered":"\u4f7f\u7528\u7e41\u9ad4\u4e2d\u6587\u8a55\u6e2c\u5404\u5bb6 Embedding \u6a21\u578b\u7684\u6aa2\u7d22\u80fd\u529b"},"content":{"rendered":"\n<blockquote class=\"wp-block-quote is-layout-flow wp-block-quote-is-layout-flow\">\n<p>\u60f3\u7cfb\u7d71\u6027\u5b78\u7fd2\u5982\u4f55\u6253\u9020 LLM\u3001RAG \u548c Agents \u61c9\u7528\u55ce? \u6b61\u8fce\u5831\u540d\u6211\u7684\u8ab2\u7a0b&nbsp;<a href=\"https:\/\/aihao.tw\/llm\">\u5927\u8a9e\u8a00\u6a21\u578b LLM \u61c9\u7528\u958b\u767c\u5de5\u4f5c\u574a<\/a><\/p>\n<\/blockquote>\n\n\n\n<figure class=\"wp-block-image size-large\"><a href=\"https:\/\/ihower.tw\/blog\/wp-content\/uploads\/2024\/07\/embedding-model-zh-tw-benchmark.jpg\"><img loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"502\" data-attachment-id=\"12173\" data-permalink=\"https:\/\/ihower.tw\/blog\/12167-embedding-models\/embedding-model-zh-tw-benchmark\" data-orig-file=\"https:\/\/ihower.tw\/blog\/wp-content\/uploads\/2024\/07\/embedding-model-zh-tw-benchmark.jpg\" data-orig-size=\"1256,616\" data-comments-opened=\"1\" data-image-meta=\"{&quot;aperture&quot;:&quot;0&quot;,&quot;credit&quot;:&quot;&quot;,&quot;camera&quot;:&quot;&quot;,&quot;caption&quot;:&quot;&quot;,&quot;created_timestamp&quot;:&quot;0&quot;,&quot;copyright&quot;:&quot;&quot;,&quot;focal_length&quot;:&quot;0&quot;,&quot;iso&quot;:&quot;0&quot;,&quot;shutter_speed&quot;:&quot;0&quot;,&quot;title&quot;:&quot;&quot;,&quot;orientation&quot;:&quot;0&quot;}\" data-image-title=\"embedding-model-zh-tw-benchmark\" data-image-description=\"\" data-image-caption=\"\" 
data-medium-file=\"https:\/\/ihower.tw\/blog\/wp-content\/uploads\/2024\/07\/embedding-model-zh-tw-benchmark-300x147.jpg\" data-large-file=\"https:\/\/ihower.tw\/blog\/wp-content\/uploads\/2024\/07\/embedding-model-zh-tw-benchmark-1024x502.jpg\" src=\"https:\/\/ihower.tw\/blog\/wp-content\/uploads\/2024\/07\/embedding-model-zh-tw-benchmark-1024x502.jpg\" alt=\"\" class=\"wp-image-12173\" srcset=\"https:\/\/ihower.tw\/blog\/wp-content\/uploads\/2024\/07\/embedding-model-zh-tw-benchmark-1024x502.jpg 1024w, https:\/\/ihower.tw\/blog\/wp-content\/uploads\/2024\/07\/embedding-model-zh-tw-benchmark-300x147.jpg 300w, https:\/\/ihower.tw\/blog\/wp-content\/uploads\/2024\/07\/embedding-model-zh-tw-benchmark-768x377.jpg 768w, https:\/\/ihower.tw\/blog\/wp-content\/uploads\/2024\/07\/embedding-model-zh-tw-benchmark.jpg 1256w\" sizes=\"auto, (max-width: 1024px) 100vw, 1024px\" \/><\/a><\/figure>\n\n\n\n<h3 class=\"wp-block-heading\"> \ud83d\udcca <a href=\"https:\/\/docs.google.com\/spreadsheets\/d\/1zad1tMFp7OmNjUvm_a-Ni22av2uBmqYclVRgJQGUtl0\/edit?usp=sharing\">\u8a55\u4f30\u6578\u64da\u7d50\u679c google spreadsheets \u50b3\u9001\u9580 \u2197\ufe0f<\/a><\/h3>\n\n\n\n<p>Updated(2024\/9\/23): \u65b0\u589e <a href=\"https:\/\/jina.ai\/news\/jina-embeddings-v3-a-frontier-multilingual-embedding-model\/\">Jina Embeddings v3<\/a><br>Updated(2024\/9\/24): \u65b0\u589e <a href=\"https:\/\/blog.voyageai.com\/2024\/09\/18\/voyage-3\/?\">Voyage-3<\/a><br>Updated(2024\/10\/22): \u65b0\u589e <a href=\"https:\/\/docs.mistral.ai\/capabilities\/embeddings\/\">mistral-embed<\/a><br>Updated(2025\/2\/12): \u65b0\u589e <a href=\"https:\/\/blog.voyageai.com\/2025\/01\/07\/voyage-3-large\/\">Voyage-3-Large<\/a>\u3001<a href=\"https:\/\/huggingface.co\/chuxin-llm\/Chuxin-Embedding\">Chuxin-Embedding<\/a>\u3001<a href=\"https:\/\/github.com\/MinishLab\/model2vec\">model2vec<\/a><br>Updated(2025\/2\/12): \u6709\u6e2c <a href=\"https:\/\/huggingface.co\/nvidia\/NV-Embed-v2\">Nvidia NV-Embed 
v2<\/a>\uff0c\u4f46\u6a21\u578b\u592a\u5927\u672c\u6a5f\u8dd1\u4e0d\u52d5\u6c92\u7d50\u679c<br>Updated(2025\/2\/13): \u65b0\u589e <a href=\"https:\/\/www.nomic.ai\/blog\/posts\/nomic-embed-text-v2\">Nomic Embed Text V2<\/a><br>Updated(2025\/6\/16): \u65b0\u589e <a href=\"https:\/\/blog.voyageai.com\/2025\/05\/20\/voyage-3-5\">Voyage-3.5 \u8ddf Voyage-3.5-lite<\/a>\u3001<a href=\"https:\/\/blog.voyageai.com\/2024\/11\/12\/voyage-multimodal-3\/\">voyage-multimodal-3<\/a>\u3001<a href=\"https:\/\/cohere.com\/blog\/embed-4\">Cohere Embed 4<\/a>\u3001<a href=\"https:\/\/qwenlm.github.io\/zh\/blog\/qwen3-embedding\/\">Qwen3 Embedding 0.6B \u8ddf 4B<\/a><br>Updated(2025\/7\/14): \u65b0\u589e <a href=\"https:\/\/huggingface.co\/jinaai\/jina-embeddings-v4\">Jina Embeddings v4<\/a><br>Updated(2025\/7\/15): \u65b0\u589e <a href=\"https:\/\/developers.googleblog.com\/en\/gemini-embedding-available-gemini-api\/\">gemini-embedding-001<\/a><br>Updated(2025\/9\/5): \u65b0\u589e <a href=\"https:\/\/developers.googleblog.com\/en\/introducing-embeddinggemma\/\">EmbeddingGemma<\/a><br><br>&#8212;<\/p>\n\n\n\n<p>\u5728 RAG \u7cfb\u7d71\u4e2d\uff0c\u5c07\u6587\u5b57\u8f49\u8a9e\u610f\u5411\u91cf\u7684 embedding \u6a21\u578b\uff0c\u662f\u975e\u5e38\u91cd\u8981\u7684\u95dc\u9375\u6aa2\u7d22\u74b0\u7bc0\u3002<br>\u5f88\u591a\u4eba\u5728\u554f\u7e41\u9ad4\u4e2d\u6587\u7684 embedding \u5efa\u8b70\u9078\u54ea\u4e00\u5957\uff0c\u901a\u5e38\u5927\u5bb6\u5c31\u63a8\u85a6\u6bd4\u8f03\u719f\u7684 OpenAI embedding \u6a21\u578b\u3002<br>\u4f46\u5230\u5e95\u54ea\u4e00\u5957\u5ba2\u89c0\u8a55\u6e2c\u6bd4\u8f03\u597d\uff0c\u5728 HuggingFace \u4e0a\u96d6\u7136\u6709\u500b <a href=\"https:\/\/huggingface.co\/spaces\/mteb\/leaderboard\">MTEB<\/a> \u6709 
(\u7c21\u9ad4)\u4e2d\u6587\u8a55\u6e2c\uff0c\u4f46\u5e7e\u4e4e\u90fd\u662f\u4e2d\u570b\u6a21\u578b\u9738\u699c\uff0c\u800c\u4e14\u611f\u89ba\u7528\u7c21\u9ad4\u4e2d\u6587\u8a55\u6e2c\u4e0d\u4ee3\u8868\u7e41\u9ad4\u4e2d\u6587\u3002<\/p>\n\n\n\n<p>\u65bc\u662f\u6211\u5c31\u60f3\u81ea\u5df1\u8dd1\u8a55\u6e2c\u770b\u770b\uff0c\u9031\u672b\u82b1\u4e86\u6642\u9593\uff0c\u53c3\u8003\u4e86 Llamaindex \u91dd\u5c0d RAG \u5834\u666f\u8a55\u6e2c Embedding \u6a21\u578b\u7684\u65b9\u6cd5(<a href=\"https:\/\/www.llamaindex.ai\/blog\/boosting-rag-picking-the-best-embedding-reranker-models-42d079022e83\">Boosting RAG: Picking the Best Embedding &amp; Reranker models<\/a>)\uff0c\u4f7f\u7528\u806f\u767c\u79d1\u6574\u7406\u7684 <a href=\"https:\/\/huggingface.co\/datasets\/MediaTek-Research\/TCEval-v2\">TCEval-v2 \u8cc7\u6599\u96c6<\/a>\u4e2d\u7684\u53f0\u9054\u95b1\u8b80\u7406\u89e3\u8cc7\u6599\u96c6 drcd\uff0c\u5176\u4e2d\u6709\u4e0d\u91cd\u8907\u6587\u7ae0\u6bb5\u843d\u5171 1000 \u6bb5\uff0c\u4ee5\u53ca\u5c0d\u61c9\u7684 3493 \u500b\u554f\u984c\u3002<\/p>\n\n\n\n<!--more-->\n\n\n\n<p>\u8a55\u4f30\u65b9\u5f0f\u662f\u5c07\u5168\u90e8\u554f\u984c\uff0c\u4ee5\u53ca\u6bcf\u500b\u554f\u984c\u5c0d\u61c9\u7684\u552f\u4e00\u6b63\u78ba context \u6bb5\u843d\uff0c\u90fd\u8f49\u6210 embedding \u5411\u91cf\uff0c\u7136\u5f8c\u6bcf\u4e00\u984c\u90fd\u53bb\u505a cosine \u76f8\u4f3c\u6027\u641c\u5c0b\uff0c\u8a55\u4f30\u6488\u51fa\u4f86\u7684 context \u662f\u5426\u6e96\u78ba\u3002\u4e5f\u5c31\u662f\u5c07 3493 \u984c\u8981\u5f9e 1000 \u500b contexts \u4e2d\uff0c\u6488\u51fa\u524d 5 \u500b\u6700\u76f8\u4f3c\u7684\uff0c\u8a08\u7b97\u5169\u500b\u6307\u6a19:<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>\u5e73\u5747 Hit Rate (\u547d\u4e2d\u7387) : \u53d6 top_k \u662f 5\uff0c\u5728\u6488\u51fa\u4f86\u6700\u76f8\u4f3c\u7684 5 \u7b46\u4e2d\uff0c\u662f\u5426\u5305\u542b\u6b63\u78ba context\u3002\u53ea\u8981\u6709\u4e2d\u5c311\u5206\uff0c\u6c92\u4e2d\u662f0\u5206<\/li>\n\n\n\n<li>\u5e73\u5747 Mean Reciprocal 
Rank (MRR \u5e73\u5747\u5012\u6578\u6392\u540d): \u5728\u6488\u51fa\u4f86\u7684\u4e94\u7b46\u4e2d\uff0c\u6b63\u78ba\u7684 context \u6392\u5728\u7b2c\u5e7e\u540d?\uff0c\u82e5\u6392\u7b2c\u4e00\u5f971\u5206\uff0c\u6392\u7b2c\u4e09\u662f 1\/3 \u5206 (\u53d6\u5012\u6578)\uff0c\u6c92\u4e2d\u5c31\u662f0\u5206<\/li>\n<\/ul>\n\n\n\n<p>\u6211\u6311\u9078\u4e86\u6709\u505a\u591a\u8a9e\u8a00\u7684\u570b\u5916\u5ee0\u5546\u6a21\u578b\uff0c\u4e5f\u5728 MTEB \u4e2d\u6587\u6392\u884c\u4e0a\u6311\u4e86\u4e00\u4e9b\u770b\u8d77\u4f86\u9760\u8b5c\u7684(\u7c21\u9ad4)\u4e2d\u6587\u6a21\u578b\uff0c\u53f0\u5ee0\u6211\u53ea\u67e5\u5230\u53f0\u667a\u96f2\u6709\u505a\u3002<br>\u5716\u8868\u5c31\u662f\u8a55\u6e2c\u7d50\u679c\uff0c\u4f9d\u7167\u547d\u4e2d\u7387\u6392\u5e8f\u3002<\/p>\n\n\n\n<p>\u6536\u7a6b\u5e7e\u9ede\u5fc3\u5f97:<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>\u6709\u6c92\u6709\u652f\u63f4\u4e2d\u6587\u5dee\u5f88\u591a\uff0c\u8a18\u5f97\u8981\u6311 multilingual \u591a\u8a9e\u8a00\u7248\u672c\uff0c\u4f8b\u5982 Google Gemini \u7684 text-embedding-004 \u5206\u6578\u8d85\u6158<\/li>\n\n\n\n<li>OpenAI \u4e0d\u662f\u6700\u5f37\u7684\uff0c\u9019\u8a55\u6e2c\u4e2d\u6700\u5f37\u7684\u662f voyage-multilingual-2\uff0c\u547d\u4e2d\u7387 97% \u8d85\u5f37<\/li>\n\n\n\n<li>\u958b\u6e90\u6700\u5f37\u662f \u5fae\u8edf\u7684 multilingual-e5-large \u547d\u4e2d\u7387 95% \u8b9a\u8b9a\uff0c\u53ef\u60dc\u8f38\u5165\u7684 tokens \u4e0a\u9650\u53ea\u6709 512 tokens \u504f\u5c11<\/li>\n\n\n\n<li>\u96a8\u8457 LLM \u7684 context window \u8b8a\u5927\u4e86\uff0c\u6211\u5011\u539f\u59cb\u8cc7\u6599\u5207\u584a(chunking) \u6642\u4e5f\u53ef\u4ee5\u96a8\u4e4b\u8b8a\u5927\u4f86\u907f\u514d\u4e0a\u4e0b\u6587\u5207\u4e0d\u597d\uff0c\u56e0\u6b64\u9019\u592a\u5c0f\u7684 tokens 
\u9650\u5236\u6703\u4e0d\u597d\u7528<\/li>\n\n\n\n<li>\u5982\u679c\u5206\u6578\u5dee\u4e0d\u591a\uff0c\u53ef\u4ee5\u9078\u5411\u91cf\u7dad\u5ea6\u5c0f\u7684\uff0c\u5132\u5b58\u548c\u8a08\u7b97\u6210\u672c\u8f03\u4f4e<\/li>\n\n\n\n<li>\u7d9c\u5408\u5e7e\u500b trade-off \u56e0\u7d20: \u5411\u91cf\u7dad\u5ea6(\u8ddf\u5132\u5b58\u548c\u8a08\u7b97\u6210\u672c\u6709\u95dc)\u3001\u8f38\u5165\u7684 tokens \u4e0a\u9650(\u8ddf\u5207\u584a\u6709\u95dc\u3001\u8ddf\u90e8\u7f72\u6210\u672c\u6709\u95dc)\u3001API \u50f9\u9322\u3001\u6e96\u78ba\u7387\u6027\u80fd<\/li>\n\n\n\n<li>\u524d\u5e7e\u540d\u5206\u6578\u5176\u5be6\u5728\u4f2f\u4ef2\u4e4b\u9593\uff0c\u611f\u89ba\u984c\u76ee\u9084\u4e0d\u5920\u96e3\uff0c\u6b61\u8fce\u5efa\u8b70\u66f4\u597d\u7684\u8cc7\u6599\u96c6<\/li>\n\n\n\n<li>\u9019\u500b\u8a55\u4f30\u662f\u91dd\u5c0d\u6aa2\u7d22\u5834\u666f\uff0c\u800c embedding \u9084\u53ef\u4ee5\u62ff\u4f86\u505a \u5206\u985e(classification) \u8ddf \u5206\u7fa4(clustering)\uff0c\u9019\u500b\u6c92\u6e2c<\/li>\n\n\n\n<li>\u6709\u4e9b\u6a21\u578b\u56e0\u6b64\u8a2d\u8a08\u53ef\u4ee5\u50b3\u53c3\u6578\u8868\u793a\u76ee\u524d\u662f\u4ec0\u9ebc\u5834\u666f\uff0c\u4f8b\u5982 Cohere \u8ddf Voyage \u6709\u500b input_type \u53c3\u6578\uff0c\u53ef\u4ee5\u6307\u5b9a\u662f search_query, search_document, classification \u6216 clustering\uff0c\u9019\u6a23\u6548\u80fd\u6703\u66f4\u597d\u4e00\u9ede<\/li>\n\n\n\n<li>\u5176\u5be6\u4e5f\u6c92\u6709\u4e00\u5b9a\u6700\u597d\u7684 embedding \u6a21\u578b\uff0c\u9700\u8981\u5728\u4f60\u81ea\u5df1\u7684\u8cc7\u6599\u96c6\u4e0a\u9762\u8dd1\u8a55\u4f30\u624d\u80fd\u6c7a\u5b9a\u6700\u597d\u6a21\u578b\uff0c\u63a8\u85a6 Weaviate \u7684\u6587\u7ae0 <a href=\"https:\/\/weaviate.io\/blog\/how-to-choose-an-embedding-model\">Step-by-Step Guide to Choosing the Best Embedding Model for Your Application<\/a><\/li>\n\n\n\n<li>\u958b\u6e90 embedding 
\u6a21\u578b\u4e5f\u53ef\u4ee5\u6839\u64da\u4f60\u7684\u8cc7\u6599\u96c6\u505a\u5fae\u8abf\uff0c\u9032\u4e00\u6b65\u63d0\u5347\u6027\u80fd\u3002<\/li>\n\n\n\n<li>\u5b8c\u6574\u7684 RAG \u662f\u500b end-to-end \u7684\u7cfb\u7d71\u6709\u5f88\u591a\u74b0\u7bc0\uff0c\u9019\u500b\u8a55\u6e2c\u53ea\u6e2c embedding \u6a21\u578b\uff0c\u4e26\u4e14\u662f\u5728\u4e00\u500b\u6c92\u6709\u5207\u584a(chunking)\u554f\u984c\u7684\u4e7e\u6de8\u8cc7\u6599\u96c6\u4e0a\u505a\u6e2c\u8a66<\/li>\n<\/ul>\n\n\n\n<p>\u6211\u7684\u5c0f\u7d50\u8ad6:<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>\u8ffd\u6c42\u6700\u597d\u6027\u80fd\u8a66\u8a66 <a href=\"https:\/\/blog.voyageai.com\/2024\/09\/18\/voyage-3\/\">Voyage-3<\/a><\/li>\n\n\n\n<li>\u4fbf\u5b9c(USD 0.02 per 1M token \u9019\u500b\u50f9\u4f4d) \u597d\u4e0a\u624b\u9078 <a href=\"https:\/\/platform.openai.com\/docs\/guides\/embeddings\">OpenAI text-embedding-3-small<\/a> \u6216 <a href=\"https:\/\/blog.voyageai.com\/2024\/09\/18\/voyage-3\/\">Voyage-3-lite<\/a> \u6216 <a href=\"https:\/\/jina.ai\/news\/jina-embeddings-v3-a-frontier-multilingual-embedding-model\/\">Jina Embeddings v3<\/a><\/li>\n\n\n\n<li>\u958b\u6e90\u6703\u9078 \u5317\u4eac\u667a\u6e90\u4eba\u5de5\u667a\u80fd\u7814\u7a76\u9662 \u7684 <a href=\"https:\/\/huggingface.co\/BAAI\/bge-m3\">bge-m3<\/a> \u6216 <a href=\"https:\/\/huggingface.co\/jinaai\/jina-embeddings-v2-base-zh\">jina-embeddings-v2-base-zh<\/a> (Jina \u662f\u5fb7\u570b\u516c\u53f8\u4f46\u5275\u8fa6\u4eba\u662f\u4e2d\u570b\u4eba) \u6216 <a href=\"https:\/\/jina.ai\/news\/jina-embeddings-v3-a-frontier-multilingual-embedding-model\/\">Jina Embeddings v3<\/a> (\u4f46\u9019\u6388\u6b0a\u662f CC-BY-NC)<\/li>\n\n\n\n<li>\u82e5\u5207\u584a chunk \u90fd\u5c0f\u65bc 512 tokens\uff0c\u53ef\u4ee5\u9078<a href=\"https:\/\/huggingface.co\/intfloat\/multilingual-e5-small\">\u5fae\u8edf e5 \u7cfb\u5217<\/a>\uff0c\u4f8b\u5982\u505a dynamic few-shot prompting 
\u7684\u5834\u666f\u3002<\/li>\n<\/ul>\n\n\n\n<p>\u8a55\u6e2c\u6578\u64da\u548c\u7a0b\u5f0f\u78bc\uff0c\u8acb\u898b\u7559\u8a00\u9023\u7d50\u3002\u82e5\u6c92\u6e2c\u5230\u7684\u4f60\u60f3\u77e5\u9053\u7684\u6a21\u578b\uff0c\u4e5f\u6b61\u8fce\u7559\u8a00\u544a\u8a34\u6211\u3002<br>\u6700\u5f8c\u611f\u8b1d <a href=\"https:\/\/www.facebook.com\/will.fans\">Will \u4fdd\u54e5<\/a> \u8ddf <a href=\"https:\/\/www.facebook.com\/ai.ycc\">YC<\/a> \u7d66\u6211\u7684\u4e00\u4e9b\u6307\u5c0e\u8ddf\u5efa\u8b70\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\">\u8a55\u6e2c\u5be6\u4f5c\u7d30\u7bc0<\/h3>\n\n\n\n<p>\u7a0b\u5f0f\u78bc\u653e\u5728 github \u4e0a\u4e86: <a href=\"https:\/\/github.com\/ihower\/zh-tw-embedding-model-benchmark\">github.com\/ihower\/zh-tw-embedding-model-benchmark<\/a><\/p>\n\n\n\n<p>\u6709\u7528\u5230 <a href=\"https:\/\/supabase.com\/\">supabase<\/a> (\u4e00\u500b PostgreSQL \u7dda\u4e0a\u670d\u52d9) \u4f86\u5b58\u5411\u91cf\u8cc7\u6599\uff0c\u9019\u4e0a\u9762\u6709\u5169\u500b tables \u5206\u5225\u662f:<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>paragraphs table \u5b58 context \u6bb5\u843d\uff0c\u6b04\u4f4d\u6709\n<ul class=\"wp-block-list\">\n<li>id<\/li>\n\n\n\n<li>embedding \u5411\u91cf<\/li>\n\n\n\n<li>model \u662f\u54ea\u4e00\u7a2e\u6a21\u578b<\/li>\n<\/ul>\n<\/li>\n\n\n\n<li>questions table \u5b58\u554f\u984c\uff0c\u6b04\u4f4d\u6709\n<ul class=\"wp-block-list\">\n<li>embedding \u5411\u91cf<\/li>\n\n\n\n<li>paragraph_id \u5c0d\u61c9\u7684\u6a19\u6e96 paragraph ID \u662f\u54ea\u4e00\u500b<\/li>\n\n\n\n<li>model \u662f\u54ea\u4e00\u7a2e\u6a21\u578b<\/li>\n<\/ul>\n<\/li>\n<\/ul>\n\n\n\n<ul class=\"wp-block-list\">\n<li>\u7a0b\u5f0f\u6709\u5169\u96bb\n<ul class=\"wp-block-list\">\n<li>indexing-{provider}.py \u8655\u7406\u8f49\u6210\u5411\u91cf\uff0c\u5b58\u5230 supabase \u8cc7\u6599\u5eab<\/li>\n\n\n\n<li>benchmark.py \u5f9e supabase \u53d6\u51fa\u67d0\u6a21\u578b\u7684\u5168\u90e8\u8cc7\u6599\uff0c\u6bcf\u500b\u554f\u984c\u8ddf paragraphs 
\u53bb\u8a08\u7b97\u76f8\u4f3c\u5ea6\uff0c\u6488\u51fa top-5 \u7136\u5f8c\u8a08\u7b97\u5e73\u5747\u5206\u6578<\/li>\n<\/ul>\n<\/li>\n<\/ul>\n\n\n\n<p>\u4f46\u6211\u6c92\u6709\u7528 pgvector \u505a\u76f8\u4f3c\u5ea6\u641c\u5c0b\uff0c\u4e00\u4f86\u662f\u70ba\u4e86\u907f\u514d\u5411\u91cf\u8cc7\u6599\u5eab\u7684 ANN \u7b97\u6cd5\u6709\u4efb\u4f55\u8aa4\u5dee\uff0c\u4e8c\u4f86\u6578\u64da\u91cf\u4e5f\u4e0d\u7b97\u662f\u975e\u5e38\u591a\uff0c\u65bc\u662f\u5c31\u5728\u672c\u6a5f\u9010\u7b46\u7b97 cosine \u76f8\u4f3c\u5ea6\u4e86\uff0c\u4e00\u500b\u6a21\u578b\u4e5f\u5c31\u662f 3493 x 1000 = 349.3 \u842c\u6b21 \u5411\u91cf\u8a08\u7b97\uff0c\u4ee5\u4e00\u53f0 MBP m2 pro \u98a8\u6247\u8f49\u4e00\u8f49\u9084\u662f\u6c92\u554f\u984c\u7684\u3002<\/p>\n\n\n\n<p>\u6240\u6709\u8a55\u6e2c\u7684\u958b\u6e90\u6a21\u578b\u90fd\u662f\u7528 <a href=\"https:\/\/sbert.net\/\">SentenceTransformers<\/a> \u5957\u4ef6\u5f9e HuggingFace \u4e0a\u4e0b\u8f09\u6a21\u578b\u56de\u4f86\uff0c\u5728\u6211\u672c\u6a5f MBP \u96fb\u8166\u4e0a\u8dd1\u8f49\u5411\u91cf\u7684\u3002\u9664\u4e86 Qwen2-1.5B \u6a21\u578b\u56e0\u70ba\u6bd4\u8f03\u5927\uff0c\u4e14\u9700\u8981 CUDA \u662f\u5728 Google Colab \u958b GPU \u8dd1\u7684\uff0c\u81f3\u65bc Qwen2-7B \u5728\u514d\u8cbb\u7248 Google Colab \u4e5f\u8dd1\u4e0d\u52d5\uff0c\u5c31\u653e\u68c4\u4e86\u3002\u9019\u5169\u500b Qwen2 \u6a21\u578b\u652f\u63f4\u5230 32000 tokens \u8f38\u5165\uff0c\u56e0\u6b64\u9700\u8981\u6bd4\u8f03\u591a\u7684\u904b\u7b97\u8cc7\u6e90\u8ddf\u8a18\u61b6\u9ad4\u3002<\/p>\n\n\n\n<p>\u53e6\u5916\u6709\u4e9b\u6a21\u578b\u7684\u6700\u5927\u8f38\u5165 tokens \u53ea\u6709 512 tokens\uff0c\u5982\u679c\u8d85\u904e\u6703\u81ea\u52d5\u622a\u65b7\u53ea\u53d6\u524d\u9762 512 tokens \u8f49\u6210\u5411\u91cf\u3002\u5728\u672c\u8cc7\u6599\u96c6\u4e2d\uff0c\u554f\u984c\u5b57\u4e32\u9577\u5ea6\u78ba\u5be6\u90fd\u5728 512 tokens \u4ee5\u4e0b\uff0c\u4f46\u662f\u6bb5\u843d contexts \u5247\u6709\u90e8\u5206\u8d85\u904e\uff0c\u5927\u7d04\u6709 10% 
\u5de6\u53f3\u7684\u6bb5\u843d\u6587\u5b57\uff0c\u843d\u5728 512~800 tokens \u4e4b\u9593\u3002\u9019\u90e8\u5206\u5404\u5bb6 tokenizer \u4e0d\u592a\u4e00\u6a23\u6240\u4ee5 tokens \u6578\u4e5f\u4e0d\u592a\u4e00\u6a23\u3002\u7e3d\u4e4b\u5c0d\u65bc\u4e0a\u9650\u662f 512 tokens \u7684\u6a21\u578b\uff0c\u9019\u500b\u8a55\u4f30\u7d50\u679c\u6703\u6709\u4e9b\u8a31\u8aa4\u5dee(\u61c9\u8a72\u662f\u4f4e\u4f30\uff0c\u5be6\u969b\u6703\u66f4\u9ad8\u5206)\uff0c\u4e0d\u904e\u5982\u540c\u6211\u4e0a\u9762\u8aaa\u7684\uff0c\u5728 RAG \u5834\u666f\u4e2d\uff0c\u6050\u6015\u662f\u4e0d\u6703\u9078\u64c7\u4e0a\u9650\u53ea\u6709 512 tokens \u7684\u6a21\u578b\u4f86\u7528\u4e86\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\">FAQ<\/h3>\n\n\n\n<p>Q: \u540c\u4e00\u500b\u61c9\u7528\u7684 Embedding \u6a21\u578b\u8ddf LLM \u6a21\u578b\u53ef\u4ee5\u4e0d\u540c\u5bb6\u5ee0\u5546\u55ce?<br>A: \u53ef\u4ee5\u7684\uff0c\u5169\u8005\u5728\u4f7f\u7528\u4e0a\u6c92\u95dc\u4fc2\u3002Embedding \u6a21\u578b\u53ea\u7528\u65bc\u6aa2\u7d22\u627e\u76f8\u4f3c\u5411\u91cf\uff0c\u627e\u5230\u5411\u91cf\u5c0d\u61c9\u7684\u6587\u5b57\u5f8c\uff0c\u6587\u5b57\u585e\u9032 prompt \u7d66 LLM \u751f\u6210\u7b54\u6848\u7d66\u7528\u6236\u3002\u6240\u4ee5\u5169\u8005\u5728\u4f7f\u7528\u4e0a\u7121\u95dc\u3002<\/p>\n\n\n\n<p>Q: \u4e0d\u540c Embedding \u6a21\u578b\u7684\u5411\u91cf\u76f8\u901a\u55ce?<br>A: \u90fd\u4e0d\u76f8\u901a\uff0c\u5305\u62ec\u540c\u4e00\u5bb6\u51fa\u7684\u4e0d\u540c\u4ee3\u6a21\u578b\u4e5f\u4e0d\u76f8\u901a\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\">\u672a\u4f86\u5c55\u671b<\/h3>\n\n\n\n<p>\u9032\u4e00\u6b65\u8a55\u6e2c Reranker \u6a21\u578b: \u6211\u5011\u53ef\u52a0\u4e0a Reranker \u505a\u4e8c\u968e\u6bb5\u6aa2\u7d22\uff0c\u4f8b\u5982\u7b2c\u4e00\u968e\u6bb5\u628a top-k \u6539 10\uff0c\u7136\u5f8c\u7b2c\u4e8c\u968e\u6bb5\u4f7f\u7528 Reranker \u5f9e\u4e2d\u53d6\u524d 5 \u9019\u6a23\u3002\u5982\u6b64\u53ef\u4ee5\u9032\u4e00\u6b65\u63d0\u5347 Hit Rate \u548c MRR 
\u5206\u6578\u3002<\/p>\n\n\n\n<p>Updated(2024\/7\/14): \u4e0b\u96c6\u4f86\u4e86\uff0c\u8acb\u898b <a href=\"https:\/\/ihower.tw\/blog\/archives\/12227\">\u4f7f\u7528\u7e41\u9ad4\u4e2d\u6587\u8a55\u6e2c\u5404\u5bb6 Reranker \u6a21\u578b\u7684\u91cd\u6392\u80fd\u529b<\/a><\/p>\n\n\n\n<p>&#8212;<\/p>\n\n\n\n<blockquote class=\"wp-block-quote is-layout-flow wp-block-quote-is-layout-flow\">\n<p><a href=\"https:\/\/www.facebook.com\/ihower\/posts\/10161211885018971\">\u6b64\u8a55\u6e2c Facebook \u8cbc\u6587\u8a0e\u8ad6 \u50b3\u9001\u9580 \u2197\ufe0f<\/a> (\u6b61\u8fce\u6309\u8b9a\u3001\u8ffd\u8e64\u3001\u5206\u4eab)<\/p>\n<\/blockquote>\n\n\n\n<blockquote class=\"wp-block-quote is-layout-flow wp-block-quote-is-layout-flow\">\n<p><a href=\"https:\/\/ihower.tw\/opt-in\/gai\">\u6b61\u8fce\u8a02\u95b1 \ud83d\udcec<\/a>&nbsp;\u611b\u597d AI Engineer \u96fb\u5b50\u5831&nbsp;<a href=\"https:\/\/ihower.tw\/blog\/archives\/category\/aie\">\u904e\u5f80\u671f\u6578\u9ede\u9019<\/a>&nbsp;\ud83d\udcda<\/p>\n<\/blockquote>\n","protected":false},"excerpt":{"rendered":"<p>\u60f3\u7cfb\u7d71\u6027\u5b78\u7fd2\u5982\u4f55\u6253\u9020 LLM\u3001RAG \u548c Agents \u61c9\u7528\u55ce? 
\u6b61\u8fce\u5831\u540d\u6211\u7684\u8ab2\u7a0b&nbsp;\u5927\u8a9e\u8a00\u6a21\u578b LL &hellip; <\/p>\n<p class=\"link-more\"><a href=\"https:\/\/ihower.tw\/blog\/12167-embedding-models\" class=\"more-link\">\u95b1\u8b80\u5168\u6587<span class=\"screen-reader-text\">\u3008\u4f7f\u7528\u7e41\u9ad4\u4e2d\u6587\u8a55\u6e2c\u5404\u5bb6 Embedding \u6a21\u578b\u7684\u6aa2\u7d22\u80fd\u529b\u3009<\/span><\/a><\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"_monsterinsights_skip_tracking":false,"_monsterinsights_sitenote_active":false,"_monsterinsights_sitenote_note":"","_monsterinsights_sitenote_category":0,"jetpack_post_was_ever_published":false,"_jetpack_newsletter_access":"","_jetpack_dont_email_post_to_subs":false,"_jetpack_newsletter_tier_id":0,"_jetpack_memberships_contains_paywalled_content":false,"_jetpack_memberships_contains_paid_content":false,"footnotes":"","jetpack_publicize_message":"","jetpack_publicize_feature_enabled":true,"jetpack_social_post_already_shared":true,"jetpack_social_options":{"image_generator_settings":{"template":"highway","default_image_id":0,"font":"","enabled":false},"version":2}},"categories":[80],"tags":[],"class_list":["post-12167","post","type-post","status-publish","format-standard","hentry","category-llm","entry"],"jetpack_publicize_connections":[],"jetpack_featured_media_url":"","jetpack_shortlink":"https:\/\/wp.me\/p1q6tG-3af","jetpack_sharing_enabled":true,"jetpack_likes_enabled":true,"_links":{"self":[{"href":"https:\/\/ihower.tw\/blog\/wp-json\/wp\/v2\/posts\/12167","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/ihower.tw\/blog\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/ihower.tw\/blog\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/ihower.tw\/blog\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/ihower.tw\/blog\/wp-json\/wp\
/v2\/comments?post=12167"}],"version-history":[{"count":73,"href":"https:\/\/ihower.tw\/blog\/wp-json\/wp\/v2\/posts\/12167\/revisions"}],"predecessor-version":[{"id":13264,"href":"https:\/\/ihower.tw\/blog\/wp-json\/wp\/v2\/posts\/12167\/revisions\/13264"}],"wp:attachment":[{"href":"https:\/\/ihower.tw\/blog\/wp-json\/wp\/v2\/media?parent=12167"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/ihower.tw\/blog\/wp-json\/wp\/v2\/categories?post=12167"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/ihower.tw\/blog\/wp-json\/wp\/v2\/tags?post=12167"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}