{"id":85,"date":"2025-04-01T17:35:07","date_gmt":"2025-04-01T09:35:07","guid":{"rendered":"https:\/\/knoka.vip\/?p=85"},"modified":"2025-04-04T11:07:16","modified_gmt":"2025-04-04T03:07:16","slug":"%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88","status":"publish","type":"post","link":"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/","title":{"rendered":"\u4f7f\u7528VLLM\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848"},"content":{"rendered":"\n<h2 class=\"wp-block-heading\">\u57fa\u7840\u4ecb\u7ecd<\/h2>\n\n\n\n<h3 class=\"wp-block-heading\">Ollama\u4ecb\u7ecd<\/h3>\n\n\n\n<p>\u8f7b\u91cf\u7ea7\u672c\u5730\u5316\u5de5\u5177\uff0c\u4e13\u4e3a\u4e2a\u4eba\u5f00\u53d1\u8005\u548c\u5c0f\u89c4\u6a21\u5b9e\u9a8c\u8bbe\u8ba1\uff0c\u4e3b\u6253\u5feb\u901f\u90e8\u7f72\u548c\u4f4e\u8d44\u6e90\u5360\u7528<\/p>\n\n\n\n<p><strong>\u6838\u5fc3\u4f18\u52bf<\/strong>\uff1a<\/p>\n\n\n\n<ul 
class=\"wp-block-list\">\n<li>\u4e00\u952e\u5b89\u88c5\uff0c\u652f\u6301\u8de8\u5e73\u53f0\uff08Windows\/macOS\/Linux\uff09\uff0c\u65e0\u9700\u7f16\u7a0b\u57fa\u7840\u5373\u53ef\u4f7f\u7528;<\/li>\n\n\n\n<li>\u5185\u7f6e1700+\u9884\u8bad\u7ec3\u6a21\u578b\uff0c\u81ea\u52a8\u4e0b\u8f7dint4\u91cf\u5316\u7248\u672c\uff0c\u663e\u5b58\u5360\u7528\u6781\u4f4e\uff08\u5982Qwen2.5-14B\u4ec5\u970011GB\u663e\u5b58\uff09;<\/li>\n\n\n\n<li>\u652f\u6301CPU\/GPU\u6df7\u5408\u8fd0\u884c\uff0c\u7a7a\u95f2\u65f6\u81ea\u52a8\u91ca\u653e\u663e\u5b58\uff0c\u9002\u5408\u4f4e\u914d\u7f6e\u8bbe\u5907\uff08\u598216GB\u5185\u5b58\u7b14\u8bb0\u672c\uff09;<\/li>\n\n\n\n<li>\u63d0\u4f9b\u7c7bChatGPT\u7684\u4ea4\u4e92\u5f0f\u547d\u4ee4\u884c\u754c\u9762\uff0c\u9002\u5408\u5feb\u901f\u6d4b\u8bd5\u548c\u539f\u578b\u5f00\u53d1;<\/li>\n<\/ul>\n\n\n\n<p><strong>\u5c40\u9650\u6027\uff1a<\/strong><\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>\u5e76\u53d1\u529b\u5f31\uff08\u5355\u6b21\u8bf7\u6c42\u54cd\u5e94\u5feb\uff0c\u4f46\u541e\u5410\u91cf\u4f4e\uff09\uff0c\u65e0\u6cd5\u5904\u7406\u9ad8\u5e76\u53d1\u4efb\u52a1\uff1b<\/li>\n\n\n\n<li>\u91cf\u5316\u6a21\u578b\u53ef\u80fd\u964d\u4f4e\u751f\u6210\u8d28\u91cf\uff08\u5982\u903b\u8f91\u4e25\u8c28\u6027\u6216\u521b\u610f\u6027\u4e0b\u964d\uff09\uff1b<\/li>\n<\/ul>\n\n\n\n<h3 class=\"wp-block-heading\">VLLM\u4ecb\u7ecd<\/h3>\n\n\n\n<p>\u751f\u4ea7\u7ea7\u63a8\u7406\u6846\u67b6\uff0c\u4e13\u6ce8\u4f01\u4e1a\u7ea7\u9ad8\u5e76\u53d1\u573a\u666f\uff0c\u5f3a\u8c03\u541e\u5410\u91cf\u548c\u7a33\u5b9a\u6027<\/p>\n\n\n\n<p><strong>\u6838\u5fc3\u4f18\u52bf<\/strong>\uff1a<\/p>\n\n\n\n<ul 
class=\"wp-block-list\">\n<li>\u57fa\u4e8ePagedAttention\u6280\u672f\u4f18\u5316\u663e\u5b58\u7ba1\u7406\uff0c\u652f\u6301\u52a8\u6001\u6279\u5904\u7406\uff0c\u5343\u7ea7\u5e76\u53d1\u541e\u5410\u91cf\u662fOllama\u768424\u500d\uff1b<\/li>\n\n\n\n<li>\u4f7f\u7528\u539f\u59cbFP16\/BF16\u6a21\u578b\uff0c\u751f\u6210\u8d28\u91cf\u9ad8\uff0c\u652f\u6301HuggingFace\u683c\u5f0f\u6a21\u578b\u548c\u5206\u5e03\u5f0f\u90e8\u7f72\uff1b<\/li>\n\n\n\n<li>\u517c\u5bb9OpenAI API\u63a5\u53e3\uff0c\u53ef\u76f4\u63a5\u66ff\u6362\u4f01\u4e1a\u73b0\u6709AI\u670d\u52a1\uff0c\u65e0\u7f1d\u96c6\u6210\u4e1a\u52a1\u7cfb\u7edf\uff1b<\/li>\n<\/ul>\n\n\n\n<p><strong>\u5c40\u9650\u6027<\/strong>\uff1a<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>\u5fc5\u987b\u4f9d\u8d56NVIDIA GPU\uff08\u5982A100\/H100\uff09\uff0c\u663e\u5b58\u5360\u7528\u9ad8\uff1b<\/li>\n\n\n\n<li>\u90e8\u7f72\u76f8\u5bf9\u590d\u6742\uff0c\u9700\u624b\u52a8\u914d\u7f6ePython\/CUDA\u73af\u5883\uff0c\u6280\u672f\u95e8\u69db\u8f83\u9ad8\uff1b<\/li>\n<\/ul>\n\n\n\n<h3 class=\"wp-block-heading\">\u4e8c\u8005\u5bf9\u6bd4<\/h3>\n\n\n\n<p>Ollama\u662f\u201c\u4e2a\u4eba\u5b9e\u9a8c\u5229\u5668\u201d\uff0cvLLM\u662f\u201c\u4f01\u4e1a\u751f\u4ea7\u5f15\u64ce\u201d\u3002\u82e5\u9700\u517c\u987e\u4e24\u8005\uff0c\u53ef\u5148\u7528Ollama\u672c\u5730\u9a8c\u8bc1\u6a21\u578b\uff0c\u518d\u7528vLLM\u90e8\u7f72\u751f\u4ea7\u73af\u5883\u3002<\/p>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><thead><tr><th class=\"has-text-align-center\" data-align=\"center\"><strong>\u5bf9\u6bd4\u7ef4\u5ea6<\/strong><\/th><th class=\"has-text-align-center\" data-align=\"center\"><strong>Ollama<\/strong><\/th><th class=\"has-text-align-center\" data-align=\"center\"><strong>vLLM<\/strong><\/th><\/tr><\/thead><tbody><tr><td class=\"has-text-align-center\" data-align=\"center\"><strong>\u6838\u5fc3\u573a\u666f<\/strong><\/td><td class=\"has-text-align-center\" 
data-align=\"center\">\u4e2a\u4eba\u5b66\u4e60\u3001\u672c\u5730\u6d4b\u8bd5<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u4f01\u4e1a\u7ea7API\u670d\u52a1\u3001\u9ad8\u5e76\u53d1\u63a8\u7406<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\"><strong>\u786c\u4ef6\u8981\u6c42<\/strong><\/td><td class=\"has-text-align-center\" data-align=\"center\">CPU\u53ef\u7528\uff0cGPU\u53ef\u9009<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u5fc5\u987bNVIDIA GPU<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\"><strong>\u663e\u5b58\u5360\u7528<\/strong><\/td><td class=\"has-text-align-center\" data-align=\"center\">\u6781\u4f4e\uff08\u91cf\u5316\u6a21\u578b\u6709\u538b\u7f29\uff09<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u6781\u9ad8\uff08\u539f\u59cb\u6a21\u578b\u5360\u7528\u5b8c\u6574\u663e\u5b58\uff09<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\"><strong>\u5355\u6b21\u63a8\u7406\u901f\u5ea6<\/strong><\/td><td class=\"has-text-align-center\" data-align=\"center\">\u66f4\u5feb\uff08Qwen2.5-7B\u7ea63\u79d2\uff09<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u7a0d\u6162\uff08Qwen2.5-7B\u7ea63.5-4.3\u79d2\uff09<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\"><strong>\u5e76\u53d1\u541e\u5410\u91cf<\/strong><\/td><td class=\"has-text-align-center\" data-align=\"center\">\u4f4e\uff08\u5355\u7ebf\u7a0b\u4e3a\u4e3b\uff09<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u6781\u9ad8\uff08\u52a8\u6001\u6279\u5904\u7406\uff0c\u652f\u6301\u5e76\u53d1\uff09<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\"><strong>\u6a21\u578b\u652f\u6301<\/strong><\/td><td class=\"has-text-align-center\" data-align=\"center\">\u5185\u7f6e1700+\u91cf\u5316\u6a21\u578b\uff0c\u5f00\u7bb1\u5373\u7528<\/td><td class=\"has-text-align-center\" 
data-align=\"center\">\u9700\u624b\u52a8\u4e0b\u8f7d\u539f\u59cb\u6a21\u578b<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\"><strong>\u90e8\u7f72\u96be\u5ea6<\/strong><\/td><td class=\"has-text-align-center\" data-align=\"center\">\u4e00\u952e\u5b89\u88c5\uff0c\u65e0\u9700\u6280\u672f\u80cc\u666f<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u9700\u914d\u7f6e\u73af\u5883\uff0c\u4f9d\u8d56\u7ecf\u9a8c<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\"><strong>\u4ea4\u4e92\u65b9\u5f0f<\/strong><\/td><td class=\"has-text-align-center\" data-align=\"center\">\u547d\u4ee4\u884c\u5bf9\u8bdd\u754c\u9762<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u4ec5API\u8c03\u7528\uff08\u65e0\u4ea4\u4e92\u754c\u9762\uff09<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\"><strong>\u6269\u5c55\u6027<\/strong><\/td><td class=\"has-text-align-center\" data-align=\"center\">\u5355\u673a\u90e8\u7f72\uff0c\u591aGPU\u652f\u6301\u6709\u9650<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u652f\u6301\u5206\u5e03\u5f0f\u90e8\u7f72\u3001\u591aGPU\u5e76\u884c<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\"><strong>\u5178\u578b\u7528\u9014<\/strong><\/td><td class=\"has-text-align-center\" data-align=\"center\">\u5199\u4ee3\u7801\u3001\u7ffb\u8bd1\u3001\u751f\u6210\u6587\u6848<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u6784\u5efa\u667a\u80fd\u5ba2\u670d\u3001\u6279\u91cf\u6570\u636e\u5206\u6790<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\"><strong>\u8d44\u6e90\u7ba1\u7406<\/strong><\/td><td class=\"has-text-align-center\" data-align=\"center\">\u7a7a\u95f2\u65f6\u91ca\u653e\u663e\u5b58\uff0c\u52a8\u6001\u8c03\u6574\u8d44\u6e90<\/td><td class=\"has-text-align-center\" 
data-align=\"center\">\u663e\u5b58\u56fa\u5b9a\u5206\u914d\uff0c\u9700\u9884\u7559\u5cf0\u503c\u8d44\u6e90<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<h2 class=\"wp-block-heading\">\u73af\u5883\u51c6\u5907<\/h2>\n\n\n\n<p>\u5927\u6a21\u578b\u90e8\u7f72\u6240\u9700\u8981\u7684\u7b97\u529b\u4e00\u822c\u6bd4\u8f83\u9ad8\uff0c\u6211\u4eec\u9700\u8981\u6839\u636e\u81ea\u5df1\u6240\u90e8\u7f72\u7684\u6a21\u578b\u8fdb\u884c\u73af\u5883\u7684\u51c6\u5907\uff0c\u672c\u6b21\u6211\u4eec\u9009\u62e9\u7684\u6a21\u578b\u662fDeepSeek-R1-Distill-Qwen-32B-AWQ\u91cf\u5316\u7248\u672c\uff0c\u4e24\u5f20A100 40G\u5361\u8db3\u591f<\/p>\n\n\n\n<figure class=\"wp-block-image size-full\"><div class='fancybox-wrapper lazyload-container-unload' data-fancybox='post-images' href='https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image.png'><img class=\"lazyload lazyload-style-1\" src=\"data:image\/svg+xml;base64,PCEtLUFyZ29uTG9hZGluZy0tPgo8c3ZnIHdpZHRoPSIxIiBoZWlnaHQ9IjEiIHhtbG5zPSJodHRwOi8vd3d3LnczLm9yZy8yMDAwL3N2ZyIgc3Ryb2tlPSIjZmZmZmZmMDAiPjxnPjwvZz4KPC9zdmc+\"  loading=\"lazy\" decoding=\"async\" width=\"808\" height=\"447\" data-original=\"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image.png\" src=\"data:image\/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAANSURBVBhXYzh8+PB\/AAffA0nNPuCLAAAAAElFTkSuQmCC\" alt=\"\" class=\"wp-image-86\"  sizes=\"auto, (max-width: 808px) 100vw, 808px\" \/><\/div><\/figure>\n\n\n\n<p>\u8fd9\u91cc\u6211\u9009\u62e9\u7528\u4e24\u5f20A100 40G\u8fdb\u884c\u6a21\u578b\u7684\u90e8\u7f72\uff0c\u901a\u8fc7nvitop\u53ef\u4ee5\u5b9e\u73b0\u5b9e\u65f6\u67e5\u770b\u8bbe\u5907\u7684\u914d\u7f6e\u4fe1\u606f\u53d8\u5316<\/p>\n\n\n\n<figure class=\"wp-block-image size-large\"><div class='fancybox-wrapper lazyload-container-unload' data-fancybox='post-images' href='https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-4-1024x266.png'><img class=\"lazyload lazyload-style-1\" 
src=\"data:image\/svg+xml;base64,PCEtLUFyZ29uTG9hZGluZy0tPgo8c3ZnIHdpZHRoPSIxIiBoZWlnaHQ9IjEiIHhtbG5zPSJodHRwOi8vd3d3LnczLm9yZy8yMDAwL3N2ZyIgc3Ryb2tlPSIjZmZmZmZmMDAiPjxnPjwvZz4KPC9zdmc+\"  loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"266\" data-original=\"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-4-1024x266.png\" src=\"data:image\/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAANSURBVBhXYzh8+PB\/AAffA0nNPuCLAAAAAElFTkSuQmCC\" alt=\"\" class=\"wp-image-94\"  sizes=\"auto, (max-width: 1024px) 100vw, 1024px\" \/><\/div><\/figure>\n\n\n\n<h2 class=\"wp-block-heading\">\u73af\u5883\u914d\u7f6e<\/h2>\n\n\n\n<p>\u4f7f\u7528VLLM\u90e8\u7f72\u6a21\u578b\uff0c\u90a3\u4e48\u9996\u5148\u5c31\u662f\u8981\u5b89\u88c5VLLM\uff0c\u8fd9\u91cc\u5b89\u88c5\u53ef\u76f4\u63a5\u4f7f\u7528pip<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>pip install vllm -i https:\/\/repo.huaweicloud.com\/repository\/pypi\/simple<\/code><\/pre>\n\n\n\n<p>\u4e4b\u540e\u5c31\u662f\u914d\u7f6e\u6a21\u578b\u4e0b\u8f7d\u529f\u80fd\uff0c\u8fd9\u91cc\u6211\u4eec\u53ef\u4ee5\u4eceModelScope\u5e73\u53f0\u8fdb\u884c\u6a21\u578b\u7684\u4e0b\u8f7d\uff0c\u4e5f\u53ef\u4ee5\u4ecehugging face\u8fdb\u884c\u6a21\u578b\u4e0b\u8f7d\uff0c\u76f8\u5bf9\u5e94\u7684\uff0c\u9009\u62e9\u54ea\u4e2a\u5e73\u53f0\u5c31\u8981\u914d\u7f6e\u90a3\u4e2a\u5e73\u53f0\u7684\u4e0b\u8f7d\u529f\u80fd\uff0c\u8fd9\u91cc\u6211\u4eec\u9009\u62e9ModelScope<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>pip install modelscope -i https:\/\/repo.huaweicloud.com\/repository\/pypi\/simple<\/code><\/pre>\n\n\n\n<h2 
class=\"wp-block-heading\">\u6a21\u578b\u9009\u62e9<\/h2>\n\n\n\n<p>\u524d\u9762\u5df2\u7ecf\u914d\u7f6e\u597d\u6211\u4eec\u7684\u6a21\u578b\u4e0b\u8f7d\u670d\u52a1\uff0c\u90a3\u4e48\u63a5\u4e0b\u6765\u5c31\u662f\u8981\u8fdb\u884c\u6a21\u578b\u7684\u4e0b\u8f7d\uff0c\u53ef\u4ee5\u5148\u5728ModelScope\u5e73\u53f0\u8fdb\u884c\u6a21\u578b\u7684\u67e5\u627e\uff1ahttps:\/\/modelscope.cn\/models<\/p>\n\n\n\n<figure class=\"wp-block-image size-large\"><div class='fancybox-wrapper lazyload-container-unload' data-fancybox='post-images' href='https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-2-1024x493.png'><img class=\"lazyload lazyload-style-1\" src=\"data:image\/svg+xml;base64,PCEtLUFyZ29uTG9hZGluZy0tPgo8c3ZnIHdpZHRoPSIxIiBoZWlnaHQ9IjEiIHhtbG5zPSJodHRwOi8vd3d3LnczLm9yZy8yMDAwL3N2ZyIgc3Ryb2tlPSIjZmZmZmZmMDAiPjxnPjwvZz4KPC9zdmc+\"  loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"493\" data-original=\"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-2-1024x493.png\" src=\"data:image\/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAANSURBVBhXYzh8+PB\/AAffA0nNPuCLAAAAAElFTkSuQmCC\" alt=\"\" class=\"wp-image-88\"  sizes=\"auto, (max-width: 1024px) 100vw, 1024px\" \/><\/div><\/figure>\n\n\n\n<p>\u4e0b\u8f7d\u6307\u4ee4\u5982\u4e0b\uff0c\u8fd9\u91cc\u6211\u53ea\u7528\u4e86\u4e24\u5f20A100\uff0c\u56e0\u6b64\u4e3a\u4fdd\u8bc1\u5bf9\u8bdd\u957f\u5ea6\uff0c\u9009\u62e9\u4f7f\u7528AWQ\u91cf\u5316\u7248\u672c<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>modelscope download --model Valdemardi\/DeepSeek-R1-Distill-Qwen-32B-AWQ --local_dir .\/DeepSeek-R1-Distill-Qwen-32B\n# modelscope download deepseek-ai\/DeepSeek-R1-Distill-Qwen-14B --local_dir .\/DeepSeek-R1-Distill-Qwen-14B\n# modelscope download --model Qwen\/QwQ-32B-AWQ --local_dir .\/QwQ-32B<\/code><\/pre>\n\n\n\n<figure class=\"wp-block-image size-large\"><div class='fancybox-wrapper lazyload-container-unload' 
data-fancybox='post-images' href='https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-5-1024x261.png'><img class=\"lazyload lazyload-style-1\" src=\"data:image\/svg+xml;base64,PCEtLUFyZ29uTG9hZGluZy0tPgo8c3ZnIHdpZHRoPSIxIiBoZWlnaHQ9IjEiIHhtbG5zPSJodHRwOi8vd3d3LnczLm9yZy8yMDAwL3N2ZyIgc3Ryb2tlPSIjZmZmZmZmMDAiPjxnPjwvZz4KPC9zdmc+\"  loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"261\" data-original=\"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-5-1024x261.png\" src=\"data:image\/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAANSURBVBhXYzh8+PB\/AAffA0nNPuCLAAAAAElFTkSuQmCC\" alt=\"\" class=\"wp-image-99\"  sizes=\"auto, (max-width: 1024px) 100vw, 1024px\" \/><\/div><\/figure>\n\n\n\n<h2 class=\"wp-block-heading\">\u670d\u52a1\u542f\u52a8<\/h2>\n\n\n\n<h3 class=\"wp-block-heading\">\u5bf9\u8bdd\u6a21\u578b<\/h3>\n\n\n\n<h4 class=\"wp-block-heading\">\u6a21\u578b\u90e8\u7f72<\/h4>\n\n\n\n<p>\u542f\u52a8\u547d\u4ee4\u5982\u4e0b\uff0c\u6ce8\u610f\u5982\u679c\u4f60\u4f7f\u7528\u7684\u662fTesla V100-SXM2-32GB\u5361\u7684\u8bdd\uff0c\u56e0\u5176\u8ba1\u7b97\u80fd\u529b\uff08Compute Capability 7.0\uff09\u4e0d\u652f\u6301bfloat16\u6570\u636e\u7c7b\u578b\uff0c\u800cvLLM\u9ed8\u8ba4\u5c1d\u8bd5\u4f7f\u7528bfloat16\uff0c\u4f46\u8be5\u6570\u636e\u7c7b\u578b\u9700\u8981\u81f3\u5c11\u652f\u6301Compute Capability 
8.0\u7684GPU\uff08\u5982A100\/A800\u7b49\uff09\uff0c\u56e0\u6b64\u9700<strong>\u4fee\u6539\u542f\u52a8\u53c2\u6570<\/strong>\uff0c\u663e\u5f0f\u6307\u5b9a\u4f7f\u7528float16\/half\u7cbe\u5ea6<\/p>\n\n\n\n<p>\u8fd9\u91cc\u6211\u7528\u7684\u5361\u662f\u53cc\u5361A100\uff0c\u53ef\u76f4\u63a5\u8fdb\u884c\u542f\u52a8\uff0cVLLM\u4f1a\u81ea\u52a8\u5224\u522b\u6a21\u578b\u662f\u4ec0\u4e48\u7c7b\u578b\u7684\uff0c\u5982\u662f\u5426\u4e3aAWQ\u91cf\u5316\uff0c\u56e0\u6b64\u8fd9\u91cc\u6211\u4eec\u65e0\u9700\u518d\u6b21\u6307\u5b9a\uff0c\u53c2\u6570\u4ecb\u7ecd\u5982\u4e0b\uff0c\u4e5f\u53ef\u53bb\u9605\u8bfb\u5b98\u65b9\u6587\u6863\uff1a<a href=\"https:\/\/docs.vllm.ai\/en\/latest\/serving\/engine_args.html\">Engine Arguments \u2014 vLLM<\/a><\/p>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><thead><tr><th class=\"has-text-align-center\" data-align=\"center\">\u53c2\u6570<\/th><th class=\"has-text-align-center\" data-align=\"center\">\u8bf4\u660e<\/th><th class=\"has-text-align-center\" data-align=\"center\">\u53ef\u9009\u503c\/\u793a\u4f8b<\/th><th class=\"has-text-align-center\" data-align=\"center\">\u5907\u6ce8<\/th><\/tr><\/thead><tbody><tr><td class=\"has-text-align-center\" data-align=\"center\">DeepSeek-R1-Distill-Qwen-32B<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u52a0\u8f7d\u7684\u6a21\u578b\u540d\u79f0<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u81ea\u5b9a\u4e49\u6a21\u578b\u8def\u5f84<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u9700\u786e\u4fdd\u6a21\u578b\u6587\u4ef6\u5b58\u5728\u4e14\u4e0evLLM\u517c\u5bb9<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;host 0.0.0.0<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u670d\u52a1\u5668\u76d1\u542c\u7684IP\u5730\u5740<\/td><td class=\"has-text-align-center\" data-align=\"center\">0.0.0.0\u6216127.0.0.1<\/td><td class=\"has-text-align-center\" 
data-align=\"center\">0.0.0.0\u5141\u8bb8\u5916\u90e8\u8bbf\u95ee<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;port 30041<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u670d\u52a1\u76d1\u542c\u7684\u7aef\u53e3\u53f7<\/td><td class=\"has-text-align-center\" data-align=\"center\">1-65535<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u9700\u786e\u4fdd\u7aef\u53e3\u672a\u88ab\u5360\u7528\u4e14\u6709\u8bbf\u95ee\u6743\u9650<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;uvicorn-log-level info<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u63a7\u5236Uvicorn\u670d\u52a1\u5668\u7684\u65e5\u5fd7\u7ea7\u522b<\/td><td class=\"has-text-align-center\" data-align=\"center\">debug,&nbsp;info,&nbsp;warning,&nbsp;error<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u8bbe\u7f6e\u4e3ainfo\u65f6\u8f93\u51fa\u57fa\u672c\u8fd0\u884c\u4fe1\u606f\uff0c\u8c03\u8bd5\u65f6\u53ef\u8bbe\u4e3adebug<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;pipeline-parallel-size 1<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u6d41\u6c34\u7ebf\u5e76\u884c\u5ea6\uff08\u591aGPU\u95f4\u5c42\u62c6\u5206\uff09<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u22651<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u901a\u5e38\u4e3a1\uff08\u7981\u7528\u6d41\u6c34\u7ebf\u5e76\u884c\uff09\uff0c\u4ec5\u5f53\u6a21\u578b\u652f\u6301\u4e14GPU\u6570\u91cf\u8db3\u591f\u65f6\u8c03\u6574<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;tensor-parallel-size 2<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u5f20\u91cf\u5e76\u884c\u5ea6\uff08\u5355\u5c42\u5185\u53c2\u6570\u62c6\u5206\u5230\u591aGPU\uff09<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u22651<\/td><td class=\"has-text-align-center\" 
data-align=\"center\">\u9700\u4e0e\u53ef\u7528GPU\u6570\u91cf\u5339\u914d\uff08\u5982\u8bbe\u7f6e\u4e3a4\u9700\u81f3\u5c114\u5757GPU\uff09<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;gpu-memory-utilization 0.9<\/td><td class=\"has-text-align-center\" data-align=\"center\">GPU\u663e\u5b58\u5229\u7528\u7387\u4e0a\u9650<\/td><td class=\"has-text-align-center\" data-align=\"center\">0.0-1.0<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u8bbe\u7f6e\u4e3a0.9\u65f6\u5141\u8bb8\u663e\u5b58\u5360\u7528\u4e0d\u8d85\u8fc790%\uff0c\u907f\u514dOOM\u9519\u8bef<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;device cuda<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u6307\u5b9a\u8fd0\u884c\u8bbe\u5907<\/td><td class=\"has-text-align-center\" data-align=\"center\">cuda\uff08GPU\uff09\u6216cpu<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u9700\u5df2\u5b89\u88c5CUDA\u9a71\u52a8\u4e14\u786c\u4ef6\u652f\u6301<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;enable-prefix-caching<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u542f\u7528\u524d\u7f00\u7f13\u5b58\u52a0\u901f\u751f\u6210<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u65e0<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u5bf9\u91cd\u590d\u524d\u7f00\u7684\u8f93\u5165\uff08\u5982\u804a\u5929\u5386\u53f2\uff09\u53ef\u663e\u8457\u63d0\u5347\u63a8\u7406\u901f\u5ea6<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;trust-remote-code<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u4fe1\u4efb\u8fdc\u7a0b\u4ee3\u7801\uff08\u5982\u52a0\u8f7d\u81ea\u5b9a\u4e49\u6a21\u578b\u4ee3\u7801\uff09<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u65e0<\/td><td class=\"has-text-align-center\" 
data-align=\"center\">\u52a0\u8f7dHuggingFace\u793e\u533a\u6a21\u578b\u65f6\u53ef\u80fd\u9700\u8981\u6b64\u53c2\u6570<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;max-model-len 131072<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u6a21\u578b\u652f\u6301\u7684\u6700\u5927\u4e0a\u4e0b\u6587\u957f\u5ea6<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u6839\u636e\u6a21\u578b\u548c\u786c\u4ef6\u8c03\u6574<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u8d85\u8fc7\u6a21\u578b\u539f\u751f\u652f\u6301\u957f\u5ea6\u65f6\u53ef\u80fd\u5f71\u54cd\u6548\u679c<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;api-key XnZ9qP7L&#8230;<\/td><td class=\"has-text-align-center\" data-align=\"center\">API\u8bbf\u95ee\u5bc6\u94a5\uff08\u8eab\u4efd\u9a8c\u8bc1\uff09<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u81ea\u5b9a\u4e49\u5b57\u7b26\u4e32<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u9700\u5728\u8bf7\u6c42\u65f6\u901a\u8fc7Header\u4f20\u9012\u76f8\u540c\u5bc6\u94a5\uff08\u5982Authorization: Bearer XnZ9qP7L&#8230;\uff09<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;enable-reasoning<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u542f\u7528\u63a8\u7406\u6a21\u5f0f\uff08\u53ef\u80fd\u5173\u8054\u4e2d\u95f4\u6b65\u9aa4\u8f93\u51fa\u6216\u7279\u5b9a\u903b\u8f91\uff09<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u65e0<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u9700\u6a21\u578b\u652f\u6301\uff08\u5982DeepSeek-R1\u53ef\u80fd\u5185\u7f6e\u63a8\u7406\u589e\u5f3a\u529f\u80fd\uff09<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;reasoning-parser deepseek_r1<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u6307\u5b9a\u63a8\u7406\u7ed3\u679c\u7684\u89e3\u6790\u5668<\/td><td class=\"has-text-align-center\" 
data-align=\"center\">\u6a21\u578b\u76f8\u5173\u503c\uff08\u5982deepseek_r1\uff09<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u9700\u4e0e\u6a21\u578b\u914d\u5957\u4f7f\u7528\uff0c\u53ef\u80fd\u7528\u4e8e\u7ed3\u6784\u5316\u8f93\u51fa\uff08\u5982\u601d\u7ef4\u94fe\u3001\u5de5\u5177\u8c03\u7528\u7b49\uff09<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<pre class=\"wp-block-code\"><code>vllm serve DeepSeek-R1-Distill-Qwen-32B --host 0.0.0.0 --port 30041 --uvicorn-log-level info --pipeline-parallel-size 1 --tensor-parallel-size 2 --gpu-memory-utilization 0.9 --device cuda  --enable-prefix-caching --trust-remote-code --max-model-len 131072 --api-key \u4f60\u7684\u5bc6\u94a5 --enable-reasoning --reasoning-parser deepseek_r1<\/code><\/pre>\n\n\n\n<figure class=\"wp-block-image size-large\"><div class='fancybox-wrapper lazyload-container-unload' data-fancybox='post-images' href='https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-6-1024x368.png'><img class=\"lazyload lazyload-style-1\" src=\"data:image\/svg+xml;base64,PCEtLUFyZ29uTG9hZGluZy0tPgo8c3ZnIHdpZHRoPSIxIiBoZWlnaHQ9IjEiIHhtbG5zPSJodHRwOi8vd3d3LnczLm9yZy8yMDAwL3N2ZyIgc3Ryb2tlPSIjZmZmZmZmMDAiPjxnPjwvZz4KPC9zdmc+\"  loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"368\" data-original=\"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-6-1024x368.png\" src=\"data:image\/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAANSURBVBhXYzh8+PB\/AAffA0nNPuCLAAAAAElFTkSuQmCC\" alt=\"\" class=\"wp-image-102\"  sizes=\"auto, (max-width: 1024px) 100vw, 1024px\" \/><\/div><\/figure>\n\n\n\n<h4 class=\"wp-block-heading\">\u6a21\u578b\u6d4b\u8bd5-Postman<\/h4>\n\n\n\n<p>\u8bf7\u6c42\u914d\u7f6e\u5982\u4e0b\uff1aMethod: POST URL: http:\/\/IP\u5730\u5740:\u7aef\u53e3\/v1\/chat\/completions<\/p>\n\n\n\n<p>Headers<\/p>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><thead><tr><th 
class=\"has-text-align-center\" data-align=\"center\">Key<\/th><th class=\"has-text-align-center\" data-align=\"center\">Value<\/th><\/tr><\/thead><tbody><tr><td class=\"has-text-align-center\" data-align=\"center\">Content-Type<\/td><td class=\"has-text-align-center\" data-align=\"center\">application\/json<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">Authorization<\/td><td class=\"has-text-align-center\" data-align=\"center\">Bearer \u542f\u52a8\u65f6\u5019\u7684\u5bc6\u94a5<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<pre class=\"wp-block-code\"><code>Request Body (JSON)\n{\n    \"model\": \"DeepSeek-R1-Distill-Qwen-32B\",\n    \"messages\": &#91;\n        {\"role\": \"system\", \"content\": \"\u4f60\u662f\u4e00\u4e2a\u4e25\u8c28\u7684AI\u52a9\u624b\"},\n        {\"role\": \"user\", \"content\": \"\u8bf7\u89e3\u91ca\u91cf\u5b50\u7ea0\u7f20\u73b0\u8c61\"}\n    ],\n    \"max_tokens\": 512,\n    \"temperature\": 0.3,\n    \"top_p\": 0.9,\n    \"reasoning\": true,\n    \"reasoning_parser\": \"deepseek_r1\",\n    \"stream\": false\n}<\/code><\/pre>\n\n\n\n<figure class=\"wp-block-image size-large\"><div class='fancybox-wrapper lazyload-container-unload' data-fancybox='post-images' href='https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-7-1024x527.png'><img class=\"lazyload lazyload-style-1\" src=\"data:image\/svg+xml;base64,PCEtLUFyZ29uTG9hZGluZy0tPgo8c3ZnIHdpZHRoPSIxIiBoZWlnaHQ9IjEiIHhtbG5zPSJodHRwOi8vd3d3LnczLm9yZy8yMDAwL3N2ZyIgc3Ryb2tlPSIjZmZmZmZmMDAiPjxnPjwvZz4KPC9zdmc+\"  loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"527\" data-original=\"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-7-1024x527.png\" src=\"data:image\/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAANSURBVBhXYzh8+PB\/AAffA0nNPuCLAAAAAElFTkSuQmCC\" alt=\"\" class=\"wp-image-107\"  sizes=\"auto, (max-width: 1024px) 100vw, 1024px\" \/><\/div><\/figure>\n\n\n\n<h4 
class=\"wp-block-heading\">OpenAI python\u6d4b\u8bd5<\/h4>\n\n\n\n<pre class=\"wp-block-code\"><code>from openai import OpenAI\nclient = OpenAI(\n    api_key=\"\u4f60\u7684\u5bc6\u94a5\",\n    base_url=\"<span style=\"background-color: initial; font-family: inherit; font-size: inherit; color: initial;\">http:\/\/IP\u5730\u5740:\u7aef\u53e3<\/span>\/v1\"\n)\nmsg = \"\u4f60\u597d\uff1f\"\nmessages = &#91;{\"role\": \"user\", \"content\": msg}]\nresponse = client.chat.completions.create(\n    model=\"DeepSeek-R1-Distill-Qwen-32B\",\n    messages=messages,\n    stream=True,\n    stream_options={\"include_usage\": True}  # \u4fee\u6b63\u53c2\u6570\u540d\u4e2d\u7684\u4e0b\u5212\u7ebf\n)\nreasoning_content = \"\"\ncontent = \"\"\nfor chunk in response:\n    # \u5148\u68c0\u67e5\u662f\u5426\u5b58\u5728\u6709\u6548\u7684choices\n    if not chunk.choices or len(chunk.choices) == 0:\n        continue  # \u8df3\u8fc7\u7a7achoices\u7684chunk\n    delta = chunk.choices&#91;0].delta\n    # \u5904\u7406reasoning_content\n    if hasattr(delta, \"reasoning_content\") and delta.reasoning_content:\n        reasoning_content += delta.reasoning_content\n        print(f\"{delta.reasoning_content}\", end=\"\", flush=True)\n    # \u5904\u7406content\n    if hasattr(delta, \"content\") and delta.content:\n        content += delta.content\n        print(f\"{delta.content}\", end=\"\", flush=True)\n# \u53ef\u9009\uff1a\u6dfb\u52a0\u6700\u7ec8\u6362\u884c\nprint()<\/code><\/pre>\n\n\n\n<figure class=\"wp-block-image size-large\"><div class='fancybox-wrapper lazyload-container-unload' data-fancybox='post-images' href='https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-8-1024x555.png'><img class=\"lazyload lazyload-style-1\" src=\"data:image\/svg+xml;base64,PCEtLUFyZ29uTG9hZGluZy0tPgo8c3ZnIHdpZHRoPSIxIiBoZWlnaHQ9IjEiIHhtbG5zPSJodHRwOi8vd3d3LnczLm9yZy8yMDAwL3N2ZyIgc3Ryb2tlPSIjZmZmZmZmMDAiPjxnPjwvZz4KPC9zdmc+\"  loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"555\" 
data-original=\"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-8-1024x555.png\" src=\"data:image\/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAANSURBVBhXYzh8+PB\/AAffA0nNPuCLAAAAAElFTkSuQmCC\" alt=\"\" class=\"wp-image-108\"  sizes=\"auto, (max-width: 1024px) 100vw, 1024px\" \/><\/div><\/figure>\n\n\n\n<h3 class=\"wp-block-heading\">\u8bcd\u5d4c\u5165\u6a21\u578b<\/h3>\n\n\n\n<p>\u4ec5\u9700\u8981\u6dfb\u52a0--task embed\u53c2\u6570\u5373\u53ef\uff0c\u793a\u4f8b\u5982\u4e0b<\/p>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><thead><tr><th class=\"has-text-align-center\" data-align=\"center\">\u53c2\u6570<\/th><th class=\"has-text-align-center\" data-align=\"center\">\u63cf\u8ff0<\/th><th class=\"has-text-align-center\" data-align=\"center\">\u793a\u4f8b\/\u503c<\/th><th class=\"has-text-align-center\" data-align=\"center\">\u5907\u6ce8<\/th><\/tr><\/thead><tbody><tr><td class=\"has-text-align-center\" data-align=\"center\">bge-base-zh-v1.5<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u8981\u52a0\u8f7d\u7684\u6a21\u578b\u540d\u79f0<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u5fc5\u586b<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u4e2d\u6587\u6587\u672c\u5d4c\u5165\u6a21\u578b\uff0c\u652f\u6301\u4e2d\u82f1\u53cc\u8bed<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;host<\/td><td class=\"has-text-align-center\" data-align=\"center\">API \u670d\u52a1\u7ed1\u5b9a\u7684\u4e3b\u673a\u5730\u5740<\/td><td class=\"has-text-align-center\" data-align=\"center\">0.0.0.0<\/td><td class=\"has-text-align-center\" data-align=\"center\">0.0.0.0&nbsp;\u8868\u793a\u5141\u8bb8\u5916\u90e8\u8bbf\u95ee<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;port<\/td><td class=\"has-text-align-center\" data-align=\"center\">API 
\u670d\u52a1\u76d1\u542c\u7684\u7aef\u53e3\u53f7<\/td><td class=\"has-text-align-center\" data-align=\"center\">30049<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u81ea\u5b9a\u4e49\u7aef\u53e3\u9700\u786e\u4fdd\u672a\u88ab\u5360\u7528<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;gpu-memory-utilization<\/td><td class=\"has-text-align-center\" data-align=\"center\">GPU \u663e\u5b58\u5229\u7528\u7387\u76ee\u6807\uff080.0-1.0\uff09<\/td><td class=\"has-text-align-center\" data-align=\"center\">0.9<\/td><td class=\"has-text-align-center\" data-align=\"center\">0.9 \u8868\u793a\u4f7f\u7528 90% \u7684\u53ef\u7528\u663e\u5b58<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;uvicorn-log-level<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u63a7\u5236 Uvicorn \u670d\u52a1\u5668\u7684\u65e5\u5fd7\u8f93\u51fa\u7ea7\u522b<\/td><td class=\"has-text-align-center\" data-align=\"center\">info<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u53ef\u9009\u503c\uff1adebug,&nbsp;info,&nbsp;warning,&nbsp;error,&nbsp;critical<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;dtype<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u6a21\u578b\u6743\u91cd\u6570\u636e\u7c7b\u578b<\/td><td class=\"has-text-align-center\" data-align=\"center\">float16<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u534a\u7cbe\u5ea6\u6d6e\u70b9\uff0c\u53ef\u51cf\u5c11\u663e\u5b58\u5360\u7528<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">&#8211;task<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u6307\u5b9a\u670d\u52a1\u4efb\u52a1\u7c7b\u578b<\/td><td class=\"has-text-align-center\" data-align=\"center\">embed<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u8868\u793a\u63d0\u4f9b\u5d4c\u5165\u751f\u6210\u670d\u52a1<\/td><\/tr><tr><td class=\"has-text-align-center\" 
data-align=\"center\">&#8211;api-key<\/td><td class=\"has-text-align-center\" data-align=\"center\">API \u8bbf\u95ee\u5bc6\u94a5\uff08\u53ef\u9009\u5b89\u5168\u9a8c\u8bc1\uff09<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u81ea\u5b9a\u4e49\u5b57\u7b26\u4e32<\/td><td class=\"has-text-align-center\" data-align=\"center\">\u9700\u8981\u5ba2\u6237\u7aef\u5728\u8bf7\u6c42\u5934\u4e2d\u643a\u5e26\u6b64\u5bc6\u94a5<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<pre class=\"wp-block-code\"><code>vllm serve bge-base-zh-v1.5 --host 0.0.0.0 --port 30049 --gpu-memory-utilization 0.9 --uvicorn-log-level info --dtype float16 --task embed --api-key \u4f60\u7684\u5bc6\u94a5<\/code><\/pre>\n\n\n\n<figure class=\"wp-block-image size-large\"><div class='fancybox-wrapper lazyload-container-unload' data-fancybox='post-images' href='https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-9-1024x343.png'><img class=\"lazyload lazyload-style-1\" src=\"data:image\/svg+xml;base64,PCEtLUFyZ29uTG9hZGluZy0tPgo8c3ZnIHdpZHRoPSIxIiBoZWlnaHQ9IjEiIHhtbG5zPSJodHRwOi8vd3d3LnczLm9yZy8yMDAwL3N2ZyIgc3Ryb2tlPSIjZmZmZmZmMDAiPjxnPjwvZz4KPC9zdmc+\"  loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"343\" data-original=\"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-9-1024x343.png\" src=\"data:image\/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAANSURBVBhXYzh8+PB\/AAffA0nNPuCLAAAAAElFTkSuQmCC\" alt=\"\" class=\"wp-image-110\"  sizes=\"auto, (max-width: 1024px) 100vw, 1024px\" \/><\/div><\/figure>\n\n\n\n<h4 class=\"wp-block-heading\">\u6a21\u578b\u6d4b\u8bd5-Postman<\/h4>\n\n\n\n<p>\u8bf7\u6c42\u914d\u7f6e\u5982\u4e0b\uff1aMethod: POST URL: http:\/\/IP\u5730\u5740:\u7aef\u53e3\/v1\/embeddings<\/p>\n\n\n\n<p>Headers<\/p>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><thead><tr><th class=\"has-text-align-center\" data-align=\"center\">Key<\/th><th 
class=\"has-text-align-center\" data-align=\"center\">Value<\/th><\/tr><\/thead><tbody><tr><td class=\"has-text-align-center\" data-align=\"center\">Content-Type<\/td><td class=\"has-text-align-center\" data-align=\"center\">application\/json<\/td><\/tr><tr><td class=\"has-text-align-center\" data-align=\"center\">Authorization<\/td><td class=\"has-text-align-center\" data-align=\"center\">Bearer \u542f\u52a8\u65f6\u5019\u7684\u5bc6\u94a5<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<pre class=\"wp-block-code\"><code>{\n    \"input\": &#91;\n        \"\u4f60\u597d\"\n    ],\n    \"model\": \"bge-base-zh-v1.5\"\n}<\/code><\/pre>\n\n\n\n<figure class=\"wp-block-image size-large\"><div class='fancybox-wrapper lazyload-container-unload' data-fancybox='post-images' href='https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-11-1024x527.png'><img class=\"lazyload lazyload-style-1\" src=\"data:image\/svg+xml;base64,PCEtLUFyZ29uTG9hZGluZy0tPgo8c3ZnIHdpZHRoPSIxIiBoZWlnaHQ9IjEiIHhtbG5zPSJodHRwOi8vd3d3LnczLm9yZy8yMDAwL3N2ZyIgc3Ryb2tlPSIjZmZmZmZmMDAiPjxnPjwvZz4KPC9zdmc+\"  loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"527\" data-original=\"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-11-1024x527.png\" src=\"data:image\/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAANSURBVBhXYzh8+PB\/AAffA0nNPuCLAAAAAElFTkSuQmCC\" alt=\"\" class=\"wp-image-112\"  sizes=\"auto, (max-width: 1024px) 100vw, 1024px\" \/><\/div><\/figure>\n\n\n\n<h4 class=\"wp-block-heading\">OpenAI Python\u6d4b\u8bd5<\/h4>\n\n\n\n<pre class=\"wp-block-code\"><code>from openai import OpenAI\n# Modify OpenAI's API key and API base to use vLLM's API server.\nopenai_api_key = \"\u4f60\u7684\u5bc6\u94a5\"\nopenai_api_base = \"<span style=\"background-color: initial; font-family: inherit; font-size: inherit; color: initial;\">http:\/\/IP\u5730\u5740:\u7aef\u53e3<\/span>\/v1\"\nclient = OpenAI(\n    # defaults to 
os.environ.get(\"OPENAI_API_KEY\")\n    api_key=openai_api_key,\n    base_url=openai_api_base,\n)\nmodels = client.models.list()\nmodel = models.data&#91;0].id\nresponses = client.embeddings.create(\n    input=&#91;\n        \"Hello my name is\",\n        \"The best thing about vLLM is that it supports many different models\"\n    ],\n    model=model,\n)\nfor data in responses.data:\n    print(data.embedding)  <\/code><\/pre>\n\n\n\n<figure class=\"wp-block-image size-large\"><div class='fancybox-wrapper lazyload-container-unload' data-fancybox='post-images' href='https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-12-1024x493.png'><img class=\"lazyload lazyload-style-1\" src=\"data:image\/svg+xml;base64,PCEtLUFyZ29uTG9hZGluZy0tPgo8c3ZnIHdpZHRoPSIxIiBoZWlnaHQ9IjEiIHhtbG5zPSJodHRwOi8vd3d3LnczLm9yZy8yMDAwL3N2ZyIgc3Ryb2tlPSIjZmZmZmZmMDAiPjxnPjwvZz4KPC9zdmc+\"  loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"493\" data-original=\"https:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/image-12-1024x493.png\" src=\"data:image\/png;base64,iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAAJcEhZcwAADsQAAA7EAZUrDhsAAAANSURBVBhXYzh8+PB\/AAffA0nNPuCLAAAAAElFTkSuQmCC\" alt=\"\" class=\"wp-image-113\"  sizes=\"auto, (max-width: 1024px) 100vw, 1024px\" \/><\/div><\/figure>\n","protected":false},"excerpt":{"rendered":"<p>\u57fa\u7840\u4ecb\u7ecd Ollama\u4ecb\u7ecd \u8f7b\u91cf\u7ea7\u672c\u5730\u5316\u5de5\u5177\uff0c\u4e13\u4e3a\u4e2a\u4eba\u5f00\u53d1\u8005\u548c\u5c0f\u89c4\u6a21\u5b9e\u9a8c\u8bbe\u8ba1\uff0c\u4e3b\u6253\u5feb\u901f\u90e8\u7f72\u548c\u4f4e\u8d44\u6e90\u5360\u7528 \u6838\u5fc3\u4f18 
[&hellip;]<\/p>\n","protected":false},"author":1,"featured_media":122,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":[],"categories":[1],"tags":[],"class_list":["post-85","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-model-serve"],"yoast_head":"<!-- This site is optimized with the Yoast SEO plugin v24.8.1 - https:\/\/yoast.com\/wordpress\/plugins\/seo\/ -->\n<title>\u4f7f\u7528VLLM\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848 - \u4eca\u5929\u5f00\u59cb\u5b66AI<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/\u4f7f\u7528vllm\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848\/\" \/>\n<meta property=\"og:locale\" content=\"zh_CN\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"\u4f7f\u7528VLLM\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848 - \u4eca\u5929\u5f00\u59cb\u5b66AI\" \/>\n<meta property=\"og:description\" content=\"\u57fa\u7840\u4ecb\u7ecd Ollama\u4ecb\u7ecd \u8f7b\u91cf\u7ea7\u672c\u5730\u5316\u5de5\u5177\uff0c\u4e13\u4e3a\u4e2a\u4eba\u5f00\u53d1\u8005\u548c\u5c0f\u89c4\u6a21\u5b9e\u9a8c\u8bbe\u8ba1\uff0c\u4e3b\u6253\u5feb\u901f\u90e8\u7f72\u548c\u4f4e\u8d44\u6e90\u5360\u7528 \u6838\u5fc3\u4f18 [&hellip;]\" \/>\n<meta property=\"og:url\" content=\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/\u4f7f\u7528vllm\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848\/\" \/>\n<meta property=\"og:site_name\" content=\"\u4eca\u5929\u5f00\u59cb\u5b66AI\" \/>\n<meta property=\"article:published_time\" content=\"2025-04-01T09:35:07+00:00\" \/>\n<meta property=\"article:modified_time\" content=\"2025-04-04T03:07:16+00:00\" \/>\n<meta property=\"og:image\" 
content=\"http:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/\u5927\u6a21\u578b\u5e94\u7528\u6846\u67b6-1.png\" \/>\n\t<meta property=\"og:image:width\" content=\"2384\" \/>\n\t<meta property=\"og:image:height\" content=\"904\" \/>\n\t<meta property=\"og:image:type\" content=\"image\/png\" \/>\n<meta name=\"author\" content=\"Knoka\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"\u4f5c\u8005\" \/>\n\t<meta name=\"twitter:data1\" content=\"Knoka\" \/>\n\t<meta name=\"twitter:label2\" content=\"\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4\" \/>\n\t<meta name=\"twitter:data2\" content=\"4 \u5206\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"Article\",\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#article\",\"isPartOf\":{\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/\"},\"author\":{\"name\":\"Knoka\",\"@id\":\"http:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84\"},\"headline\":\"\u4f7f\u7528VLLM\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848\",\"datePublished\":\"2025-04-01T09:35:07+00:00\",\"dateModified\":\"2025-04-04T03:07:16+00:00\",\"mainEntityOfPage\":{\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/\"},\"wordCount\":221,\"commentCount\":0,\"publisher\":{\"@id\":\"http:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84\"},\"image\":{\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e
5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#primaryimage\"},\"thumbnailUrl\":\"http:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/\u5927\u6a21\u578b\u5e94\u7528\u6846\u67b6-1.png\",\"articleSection\":[\"\u6a21\u578b\u90e8\u7f72\"],\"inLanguage\":\"zh-Hans\",\"potentialAction\":[{\"@type\":\"CommentAction\",\"name\":\"Comment\",\"target\":[\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#respond\"]}]},{\"@type\":\"WebPage\",\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/\",\"url\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/\",\"name\":\"\u4f7f\u7528VLLM\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848 - 
\u4eca\u5929\u5f00\u59cb\u5b66AI\",\"isPartOf\":{\"@id\":\"http:\/\/knoka.vip\/#website\"},\"primaryImageOfPage\":{\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#primaryimage\"},\"image\":{\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#primaryimage\"},\"thumbnailUrl\":\"http:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/\u5927\u6a21\u578b\u5e94\u7528\u6846\u67b6-1.png\",\"datePublished\":\"2025-04-01T09:35:07+00:00\",\"dateModified\":\"2025-04-04T03:07:16+00:00\",\"breadcrumb\":{\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#breadcrumb\"},\"inLanguage\":\"zh-Hans\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/\"]}]},{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#primaryimage\",\"url\":\"http:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/\u5927\u6a21\u578b\u5e94\u7528\u6846\u67b6-1.png\",\"contentUrl\":\"http:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/\u5927\u6a21\u578b\u5e94\u7528\u6846\u67b6-1.png\",\"width\":2384,\"height\":904},{\"@type\":\"BreadcrumbList\",\"@id\":\"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#breadcrumb\",\"itemList
Element\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"\u9996\u9875\",\"item\":\"http:\/\/knoka.vip\/\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"\u4f7f\u7528VLLM\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848\"}]},{\"@type\":\"WebSite\",\"@id\":\"http:\/\/knoka.vip\/#website\",\"url\":\"http:\/\/knoka.vip\/\",\"name\":\"\u4eca\u5929\u5f00\u59cb\u5b66AI\",\"description\":\"\u77e5\u8bc6\u5206\u4eab\",\"publisher\":{\"@id\":\"http:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84\"},\"potentialAction\":[{\"@type\":\"SearchAction\",\"target\":{\"@type\":\"EntryPoint\",\"urlTemplate\":\"http:\/\/knoka.vip\/?s={search_term_string}\"},\"query-input\":{\"@type\":\"PropertyValueSpecification\",\"valueRequired\":true,\"valueName\":\"search_term_string\"}}],\"inLanguage\":\"zh-Hans\"},{\"@type\":[\"Person\",\"Organization\"],\"@id\":\"http:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84\",\"name\":\"Knoka\",\"image\":{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"http:\/\/knoka.vip\/#\/schema\/person\/image\/\",\"url\":\"https:\/\/gravatar.pho.ink\/avatar\/a81dd1238e551ec6c470995487946913852d59837b557d5166ae60169466da05?s=96&r=g&d=404\",\"contentUrl\":\"https:\/\/gravatar.pho.ink\/avatar\/a81dd1238e551ec6c470995487946913852d59837b557d5166ae60169466da05?s=96&r=g&d=404\",\"caption\":\"Knoka\"},\"logo\":{\"@id\":\"http:\/\/knoka.vip\/#\/schema\/person\/image\/\"},\"sameAs\":[\"http:\/\/118.178.172.39\"],\"url\":\"http:\/\/knoka.vip\/index.php\/author\/admin\/\"}]}<\/script>\n<!-- \/ Yoast SEO plugin. 
-->","yoast_head_json":{"title":"\u4f7f\u7528VLLM\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848 - \u4eca\u5929\u5f00\u59cb\u5b66AI","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/\u4f7f\u7528vllm\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848\/","og_locale":"zh_CN","og_type":"article","og_title":"\u4f7f\u7528VLLM\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848 - \u4eca\u5929\u5f00\u59cb\u5b66AI","og_description":"\u57fa\u7840\u4ecb\u7ecd Ollama\u4ecb\u7ecd \u8f7b\u91cf\u7ea7\u672c\u5730\u5316\u5de5\u5177\uff0c\u4e13\u4e3a\u4e2a\u4eba\u5f00\u53d1\u8005\u548c\u5c0f\u89c4\u6a21\u5b9e\u9a8c\u8bbe\u8ba1\uff0c\u4e3b\u6253\u5feb\u901f\u90e8\u7f72\u548c\u4f4e\u8d44\u6e90\u5360\u7528 \u6838\u5fc3\u4f18 [&hellip;]","og_url":"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/\u4f7f\u7528vllm\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848\/","og_site_name":"\u4eca\u5929\u5f00\u59cb\u5b66AI","article_published_time":"2025-04-01T09:35:07+00:00","article_modified_time":"2025-04-04T03:07:16+00:00","og_image":[{"width":2384,"height":904,"url":"http:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/\u5927\u6a21\u578b\u5e94\u7528\u6846\u67b6-1.png","type":"image\/png"}],"author":"Knoka","twitter_card":"summary_large_image","twitter_misc":{"\u4f5c\u8005":"Knoka","\u9884\u8ba1\u9605\u8bfb\u65f6\u95f4":"4 
\u5206"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"Article","@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#article","isPartOf":{"@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/"},"author":{"name":"Knoka","@id":"http:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84"},"headline":"\u4f7f\u7528VLLM\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848","datePublished":"2025-04-01T09:35:07+00:00","dateModified":"2025-04-04T03:07:16+00:00","mainEntityOfPage":{"@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/"},"wordCount":221,"commentCount":0,"publisher":{"@id":"http:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84"},"image":{"@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#primaryimage"},"thumbnailUrl":"http:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/\u5927\u6a21\u578b\u5e94\u7528\u6846\u67b6-1.png","articleSection":["\u6a21\u578b\u90e8\u7f72"],"inLanguage":"zh-Hans","potentialAction":[{"@type":"CommentAction","name":"Comment","target":["http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#respond"]}]},{"@type":"WebPage","@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/","url":"http:\/\/knoka.vip\/index.
php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/","name":"\u4f7f\u7528VLLM\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848 - \u4eca\u5929\u5f00\u59cb\u5b66AI","isPartOf":{"@id":"http:\/\/knoka.vip\/#website"},"primaryImageOfPage":{"@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#primaryimage"},"image":{"@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#primaryimage"},"thumbnailUrl":"http:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/\u5927\u6a21\u578b\u5e94\u7528\u6846\u67b6-1.png","datePublished":"2025-04-01T09:35:07+00:00","dateModified":"2025-04-04T03:07:16+00:00","breadcrumb":{"@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#breadcrumb"},"inLanguage":"zh-Hans","potentialAction":[{"@type":"ReadAction","target":["http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/"]}]},{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"http:\/\/knoka.vip\/index.php\/2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#primaryimage","url":"http:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/\u5927\u6a21\u578b\u5e94\u7528\u6846\u67b6-1.png","contentUrl":"http:\/\/knoka.vip\/wp-content\/uploads\/2025\/04\/\u5927\u6a21\u578b\u5e94\u7528\u6846\u67b6-1.png","width":2384,"height":904},{"@type":"BreadcrumbList","@id":"http:\/\/knoka.vip\/index.php\/
2025\/04\/01\/%e4%bd%bf%e7%94%a8vllm%e9%83%a8%e7%bd%b2%e4%b8%80%e7%b3%bb%e5%88%97%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e6%96%b9%e6%a1%88\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"\u9996\u9875","item":"http:\/\/knoka.vip\/"},{"@type":"ListItem","position":2,"name":"\u4f7f\u7528VLLM\u90e8\u7f72\u4e00\u7cfb\u5217\u5927\u8bed\u8a00\u6a21\u578b\u65b9\u6848"}]},{"@type":"WebSite","@id":"http:\/\/knoka.vip\/#website","url":"http:\/\/knoka.vip\/","name":"\u4eca\u5929\u5f00\u59cb\u5b66AI","description":"\u77e5\u8bc6\u5206\u4eab","publisher":{"@id":"http:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84"},"potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"http:\/\/knoka.vip\/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"zh-Hans"},{"@type":["Person","Organization"],"@id":"http:\/\/knoka.vip\/#\/schema\/person\/59bf442e4e4c21f6969b984b8c5bfc84","name":"Knoka","image":{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"http:\/\/knoka.vip\/#\/schema\/person\/image\/","url":"https:\/\/gravatar.pho.ink\/avatar\/a81dd1238e551ec6c470995487946913852d59837b557d5166ae60169466da05?s=96&r=g&d=404","contentUrl":"https:\/\/gravatar.pho.ink\/avatar\/a81dd1238e551ec6c470995487946913852d59837b557d5166ae60169466da05?s=96&r=g&d=404","caption":"Knoka"},"logo":{"@id":"http:\/\/knoka.vip\/#\/schema\/person\/image\/"},"sameAs":["http:\/\/118.178.172.39"],"url":"http:\/\/knoka.vip\/index.php\/author\/admin\/"}]}},"_links":{"self":[{"href":"http:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/posts\/85","targetHints":{"allow":["GET"]}}],"collection":[{"href":"http:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"http:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"http:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddab
le":true,"href":"http:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/comments?post=85"}],"version-history":[{"count":0,"href":"http:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/posts\/85\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"http:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/media\/122"}],"wp:attachment":[{"href":"http:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/media?parent=85"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"http:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/categories?post=85"},{"taxonomy":"post_tag","embeddable":true,"href":"http:\/\/knoka.vip\/index.php\/wp-json\/wp\/v2\/tags?post=85"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}