
{"id":3801,"date":"2024-12-10T22:40:08","date_gmt":"2024-12-10T14:40:08","guid":{"rendered":"https:\/\/infernews.com\/?page_id=3801"},"modified":"2025-02-20T23:31:12","modified_gmt":"2025-02-20T15:31:12","slug":"%e4%bd%95%e8%ac%82-text-embedding","status":"publish","type":"page","link":"https:\/\/infernews.com\/blog\/%e4%bd%95%e8%ac%82-text-embedding\/","title":{"rendered":"\u4f55\u8b02 Text Embedding"},"content":{"rendered":"<p>Text Embedding\uff08\u6587\u672c\u5d4c\u5165\uff09\u662f\u4e00\u7a2e\u81ea\u7136\u8a9e\u8a00\u8655\u7406\u6280\u8853\uff0c\u7528\u65bc\u5c07\u6587\u672c\u8f49\u63db\u6210\u6578\u503c\u5411\u91cf\uff0c\u4fdd\u7559\u5176\u539f\u59cb\u6587\u672c\u7684\u610f\u7fa9\u548c\u7d50\u69cb\u3002\u9019\u4e9b\u5411\u91cf\u88ab\u7a31\u70baEmbeddings\uff0c\u5b83\u5011\u53ef\u4ee5\u7528\u65bc\u8a31\u591aNLP\u4efb\u52d9\uff0c\u5982\u6587\u672c\u985e\u4f3c\u5ea6\u8a08\u7b97\u3001\u6587\u672c\u751f\u6210\u3001\u6587\u672c\u5206\u985e\u7b49\u3002 Text Embedding\u7684\u76ee\u6a19\u662f\u5c07\u6587\u672c\u8f49\u63db\u6210\u4e00\u7a2e\u53ef\u6578\u5b78\u5316\u7684\u5f62\u5f0f\uff0c\u4f7f\u5f97\u5b83\u5011\u80fd\u5920\u8207\u5176\u4ed6\u6578\u503c\u5411\u91cf\u9032\u884c\u6bd4\u8f03\u548c\u904b\u7b97\u3002\u9019\u6a23\u53ef\u4ee5\u8b93\u6a21\u578b\u5728\u8655\u7406\u6587\u672c\u6642\uff0c\u80fd\u5920\u5229\u7528\u50b3\u7d71\u7684\u795e\u7d93\u7db2\u8def\u6280\u8853\u4f86\u9032\u884c\u5206\u6790\u548c\u9810\u6e2c\u3002 \u5e38\u898b\u7684Text Embedding\u65b9\u6cd5\u5305\u62ec\uff1a Word2Vec\uff1a\u662f\u4e00\u7a2e\u7528\u65bc\u5c07\u55ae\u8a5e\u8f49\u63db\u6210\u6578\u503c\u5411\u91cf\u7684\u65b9\u6cd5\uff0c\u5b83\u901a\u904e\u8a13\u7df4Word Embeddings\u6a21\u578b\u4f86\u7372\u5f97\u6bcf\u500b\u55ae\u8a5e\u7684\u5411\u91cf\u8868\u9054\u3002 GloVe\uff1a\u662f\u4e00\u7a2e\u57fa\u65bc\u77e9\u9663\u5206\u89e3\u7684\u65b9\u6cd5\uff0c\u65e8\u5728\u7372\u53d6\u6bcf\u500b\u55ae\u8a5e\u7684\u5411\u91cf\u8868\u9054\uff0c\u4e26\u5229\u7528\u6587\u672c\u4e2d\u55ae\u8a5e\u4e4b\u9593\u7684\u95dc\u806f\u4fe1\u606f\u4f86\u9032\u884c\u5b78\u7fd2\u3002 BERT\uff08Bidirectional Encoder Representations from Transformers\uff09\uff1a\u662f\u4e00\u7a2e\u57fa\u65bctransformer\u67b6\u69cb\u7684\u9810\u8a13\u7df4\u6a21\u578b\uff0c\u5b83\u901a\u904e\u5c07\u6587\u672c\u8f49\u63db\u6210\u5411\u91cf\u8868\u9054\uff0c\u4e26\u4e14\u80fd\u5920\u6355\u6349\u5230\u6587\u672c\u4e2d\u7684\u9577\u8ddd\u96e2\u4f9d\u8cf4\u95dc\u4fc2\u3002 Text Embedding\u6709\u8a31\u591a\u61c9\u7528\uff0c\u5305\u62ec\uff1a \u6587\u672c\u985e\u4f3c\u5ea6\u8a08\u7b97\uff1a\u4f7f\u7528Embeddings\u53ef\u4ee5\u6bd4\u8f03\u5169\u500b\u6587\u672c\u7684\u76f8\u4f3c\u7a0b\u5ea6\u3002 \u6587\u672c\u5206\u985e\uff1a\u901a\u904e\u5c07\u6587\u672c\u8f49\u63db\u6210\u5411\u91cf\u8868\u9054\uff0c\u53ef\u4ee5\u9032\u884c\u6587\u672c\u5206\u985e\u7b49NLP\u4efb\u52d9\u3002 \u6587\u672c\u751f\u6210\uff1a Embeddings\u53ef\u4ee5\u7528\u65bc\u751f\u6210\u65b0\u7684\u6587\u672c\uff0c\u4f8b\u5982\u6587\u672c\u6458\u8981\u6216\u6587\u672c\u5b8c\u6210\u3002 4.\u63a8\u85a6\u7cfb\u7d71\uff1a\u4f7f\u7528Embeddings\u53ef\u4ee5\u5efa\u69cb\u51fa\u57fa\u65bc\u6587\u672c\u7684\u63a8\u85a6\u7cfb\u7d71\u3002<\/p>\n<p>\u00a0<\/p>\n\n\n<figure class=\"wp-block-embed is-type-video is-provider-youtube wp-block-embed-youtube wp-embed-aspect-16-9 wp-has-aspect-ratio\"><div class=\"wp-block-embed__wrapper\">\n<div class=\"lyte-wrapper\" title=\"How word vectors encode meaning\" style=\"width:853px;max-width:100%;margin:5px auto;\"><div class=\"lyMe\" id=\"WYL_FJtFZwbvkI4\" itemprop=\"video\" itemscope itemtype=\"https:\/\/schema.org\/VideoObject\"><div><meta itemprop=\"thumbnailUrl\" content=\"https:\/\/infernews.com\/blog\/wp-content\/plugins\/wp-youtube-lyte\/lyteCache.php?origThumbUrl=https%3A%2F%2Fi.ytimg.com%2Fvi%2FFJtFZwbvkI4%2Fhqdefault.jpg\" \/><meta itemprop=\"embedURL\" content=\"https:\/\/www.youtube.com\/embed\/FJtFZwbvkI4\" \/><meta itemprop=\"duration\" content=\"PT1M\" \/><meta itemprop=\"uploadDate\" content=\"2024-04-11T16:23:26Z\" \/><\/div><meta itemprop=\"accessibilityFeature\" content=\"captions\" \/><div id=\"lyte_FJtFZwbvkI4\" data-src=\"https:\/\/infernews.com\/blog\/wp-content\/plugins\/wp-youtube-lyte\/lyteCache.php?origThumbUrl=https%3A%2F%2Fi.ytimg.com%2Fvi%2FFJtFZwbvkI4%2Fhqdefault.jpg\" class=\"pL\"><div class=\"tC\"><div class=\"tT\" itemprop=\"name\">How word vectors encode meaning<\/div><\/div><div class=\"play\"><\/div><div class=\"ctrl\"><div class=\"Lctrl\"><\/div><div class=\"Rctrl\"><\/div><\/div><\/div><noscript><a href=\"https:\/\/youtu.be\/FJtFZwbvkI4\" rel=\"nofollow\"><img loading=\"lazy\" decoding=\"async\" src=\"https:\/\/infernews.com\/blog\/wp-content\/plugins\/wp-youtube-lyte\/lyteCache.php?origThumbUrl=https%3A%2F%2Fi.ytimg.com%2Fvi%2FFJtFZwbvkI4%2F0.jpg\" alt=\"How word vectors encode meaning\" width=\"853\" height=\"460\" \/><br \/>Watch this video on YouTube<\/a><\/noscript><meta itemprop=\"description\" content=\"This comes from a full video dissecting how LLMs work. In the shorts player, you can click the link at the bottom of the screen, or for reference: https:\/\/youtu.be\/wjZofJX0v4M\"><\/div><\/div><div class=\"lL\" style=\"max-width:100%;width:853px;margin:5px auto;\"><\/div>\n<\/div><\/figure>\n","protected":false},"excerpt":{"rendered":"<p>Text Embedding\uff08\u6587\u672c\u5d4c\u5165\uff09\u662f\u4e00\u7a2e\u81ea\u7136\u8a9e\u8a00\u8655\u7406\u6280\u8853\uff0c\u7528\u65bc\u5c07\u6587\u672c\u8f49\u63db\u6210\u6578\u503c\u5411\u91cf\uff0c\u4fdd\u7559\u5176\u539f\u59cb\u6587\u672c\u7684\u610f\u7fa9\u548c\u7d50\u69cb\u3002\u9019\u4e9b\u5411\u91cf\u88ab\u7a31\u70baEmbeddings\uff0c\u5b83\u5011\u53ef\u4ee5\u7528\u65bc\u8a31\u591aNLP\u4efb\u52d9\uff0c\u5982\u6587\u672c\u985e\u4f3c\u5ea6\u8a08\u7b97\u3001\u6587\u672c\u751f\u6210\u3001\u6587\u672c\u5206\u985e\u7b49\u3002 Text Embedding\u7684\u76ee\u6a19\u662f\u5c07\u6587\u672c\u8f49\u63db\u6210\u4e00\u7a2e\u53ef\u6578\u5b78\u5316\u7684\u5f62\u5f0f\uff0c\u4f7f\u5f97\u5b83\u5011\u80fd\u5920\u8207\u5176\u4ed6\u6578\u503c\u5411\u91cf\u9032\u884c\u6bd4\u8f03\u548c\u904b\u7b97\u3002\u9019\u6a23\u53ef\u4ee5\u8b93\u6a21\u578b\u5728\u8655\u7406\u6587\u672c\u6642\uff0c\u80fd\u5920\u5229\u7528\u50b3\u7d71\u7684\u795e\u7d93\u7db2\u8def\u6280\u8853\u4f86\u9032\u884c\u5206\u6790\u548c\u9810\u6e2c\u3002 \u5e38\u898b\u7684Text Embedding\u65b9\u6cd5\u5305\u62ec\uff1a Word2Vec\uff1a\u662f\u4e00\u7a2e\u7528\u65bc\u5c07\u55ae\u8a5e\u8f49\u63db\u6210\u6578\u503c\u5411\u91cf\u7684\u65b9\u6cd5\uff0c\u5b83\u901a\u904e\u8a13\u7df4Word Embeddings\u6a21\u578b\u4f86\u7372\u5f97\u6bcf\u500b\u55ae\u8a5e\u7684\u5411\u91cf\u8868\u9054\u3002 GloVe\uff1a\u662f\u4e00\u7a2e\u57fa\u65bc\u77e9\u9663\u5206\u89e3\u7684\u65b9\u6cd5\uff0c\u65e8\u5728\u7372\u53d6\u6bcf\u500b\u55ae\u8a5e\u7684\u5411\u91cf\u8868\u9054\uff0c\u4e26\u5229\u7528\u6587\u672c\u4e2d\u55ae\u8a5e\u4e4b\u9593\u7684\u95dc\u806f\u4fe1\u606f\u4f86\u9032\u884c\u5b78\u7fd2\u3002 BERT\uff08Bidirectional Encoder Representations from Transformers\uff09\uff1a\u662f\u4e00\u7a2e\u57fa\u65bctransformer\u67b6\u69cb\u7684\u9810\u8a13\u7df4\u6a21\u578b\uff0c\u5b83\u901a\u904e\u5c07\u6587\u672c\u8f49\u63db\u6210\u5411\u91cf\u8868\u9054\uff0c\u4e26\u4e14\u80fd\u5920\u6355\u6349\u5230\u6587\u672c\u4e2d\u7684\u9577\u8ddd\u96e2\u4f9d\u8cf4\u95dc\u4fc2\u3002 Text Embedding\u6709\u8a31\u591a\u61c9\u7528\uff0c\u5305\u62ec\uff1a \u6587\u672c\u985e\u4f3c\u5ea6\u8a08\u7b97\uff1a\u4f7f\u7528Embeddings\u53ef\u4ee5\u6bd4\u8f03\u5169\u500b\u6587\u672c\u7684\u76f8\u4f3c\u7a0b\u5ea6\u3002 \u6587\u672c\u5206\u985e\uff1a\u901a\u904e\u5c07\u6587\u672c\u8f49\u63db\u6210\u5411\u91cf\u8868\u9054\uff0c\u53ef\u4ee5\u9032\u884c\u6587\u672c\u5206\u985e\u7b49NLP\u4efb\u52d9\u3002 \u6587\u672c\u751f\u6210\uff1a Embeddings\u53ef\u4ee5\u7528\u65bc\u751f\u6210\u65b0\u7684\u6587\u672c\uff0c\u4f8b\u5982\u6587\u672c\u6458\u8981\u6216\u6587\u672c\u5b8c\u6210\u3002 4.\u63a8\u85a6\u7cfb\u7d71\uff1a\u4f7f\u7528Embeddings\u53ef\u4ee5\u5efa\u69cb\u51fa\u57fa\u65bc\u6587\u672c\u7684\u63a8\u85a6\u7cfb\u7d71\u3002 \u00a0<\/p>\n","protected":false},"author":1,"featured_media":0,"parent":0,"menu_order":0,"comment_status":"closed","ping_status":"closed","template":"","meta":{"googlesitekit_rrm_CAowvqSiDA:productID":"","footnotes":""},"class_list":["post-3801","page","type-page","status-publish","hentry"],"_links":{"self":[{"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/pages\/3801","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/pages"}],"about":[{"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/types\/page"}],"author":[{"embeddable":true,"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/comments?post=3801"}],"version-history":[{"count":0,"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/pages\/3801\/revisions"}],"wp:attachment":[{"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/media?parent=3801"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}