{"id":4453,"date":"2025-10-22T17:16:38","date_gmt":"2025-10-22T09:16:38","guid":{"rendered":"https:\/\/www.ihub1.com\/?p=4453"},"modified":"2025-10-22T17:18:08","modified_gmt":"2025-10-22T09:18:08","slug":"%e9%98%bf%e9%87%8c%e4%ba%91%e7%a7%98%e5%af%86%e6%ad%a6%e5%99%a8%e4%ba%ae%e7%9b%b8%e9%a1%b6%e4%bc%9a%ef%bc%9a%e7%8b%82%e7%a0%8d82%e8%8b%b1%e4%bc%9f%e8%be%be%e5%90%ab%e9%87%8f%ef%bc%8c213%e5%9d%97gpu","status":"publish","type":"post","link":"https:\/\/www.ihub1.com\/index.php\/2025\/10\/22\/%e9%98%bf%e9%87%8c%e4%ba%91%e7%a7%98%e5%af%86%e6%ad%a6%e5%99%a8%e4%ba%ae%e7%9b%b8%e9%a1%b6%e4%bc%9a%ef%bc%9a%e7%8b%82%e7%a0%8d82%e8%8b%b1%e4%bc%9f%e8%be%be%e5%90%ab%e9%87%8f%ef%bc%8c213%e5%9d%97gpu\/","title":{"rendered":"\u963f\u91cc\u4e91\u79d8\u5bc6\u6b66\u5668\u4eae\u76f8\u9876\u4f1a\uff1a\u72c2\u780d82%\u82f1\u4f1f\u8fbe\u542b\u91cf\uff0c213\u5757GPU\u5e72\u4e861192\u5757\u7684\u6d3b"},"content":{"rendered":"\t\t<div data-elementor-type=\"wp-post\" data-elementor-id=\"4453\" class=\"elementor elementor-4453\">\n\t\t\t\t<div class=\"elementor-element elementor-element-c437474 e-flex e-con-boxed e-con e-parent\" data-id=\"c437474\" data-element_type=\"container\" data-e-type=\"container\">\n\t\t\t\t\t<div class=\"e-con-inner\">\n\t\t\t\t<div class=\"elementor-element elementor-element-62fb533 elementor-widget elementor-widget-text-editor\" data-id=\"62fb533\" data-element_type=\"widget\" data-e-type=\"widget\" data-widget_type=\"text-editor.default\">\n\t\t\t\t<div class=\"elementor-widget-container\">\n\t\t\t\t\t\t\t\t\t<p>\u963f\u91cc\u4e91\u79d8\u5bc6\u6b66\u5668\u4eae\u76f8\u9876\u4f1a SOSP\uff1a\u7528\u65b0\u6280\u672f\u780d\u6389 82% \u7684\u82f1\u4f1f\u8fbe GPU \u9700\u6c42\u3002<\/p><p>\u4e00\u65f6\u5f15\u8d77\u4e0d\u5c0f\u5173\u6ce8\u4e0e\u8ba8\u8bba\u3002<\/p><div id=\"id_imagebox_0\" class=\"img_box \"><div class=\"content_img_div perview_img_div\"><img decoding=\"async\" id=\"img_0\" class=\"opacity_0\" 
src=\"https:\/\/zkres1.myzaker.com\/202510\/68f81cec8e9f09311f7a839f_1024.jpg\" data-height=\"214\" data-width=\"1426\" \/><\/div><\/div><p>\u8fd9\u9879\u7814\u7a76\u7531\u963f\u91cc\u5df4\u5df4\u4e0e\u5317\u5927\u5408\u4f5c\uff0c\u963f\u91cc\u4e91 CTO \u5468\u9756\u4eba\u5e26\u961f\u3002<\/p><p>\u7814\u7a76\u63d0\u51fa\u6700\u65b0 GPU \u6c60\u5316\u7cfb\u7edf Aegaeon\uff0c\u7528 token \u7ea7\u522b\u7684\u81ea\u52a8\u6269\u7f29\u5bb9\u6280\u672f\uff0c\u786c\u662f\u628a GPU \u4f7f\u7528\u91cf\u4ece 1192 \u4e2a &#8221; \u7626\u8eab &#8221; \u5230 213 \u4e2a\u3002<\/p><div id=\"id_imagebox_1\" class=\"img_box \"><div class=\"content_img_div perview_img_div\"><img decoding=\"async\" id=\"img_1\" class=\"opacity_0\" src=\"https:\/\/zkres1.myzaker.com\/202510\/68f81cec8e9f09311f7a83a0_1024.jpg\" data-height=\"514\" data-width=\"1754\" \/><\/div><\/div><p>\u8fd9\u9879\u7814\u7a76\u51fa\u53d1\u70b9\u5728\u5bf9\u963f\u91cc\u4e91\u81ea\u8eab\u4e1a\u52a1\u4e00\u9879\u89c2\u5bdf\u3002<\/p><p>\u5728 Model Studio\uff08\u767e\u70bc\u5e73\u53f0\uff09\u4e0a\uff0c\u4ed6\u4eec\u53d1\u73b0\u4e86\u4e00\u4e2a\u8ba9\u4eba\u5934\u75bc\u7684\u73b0\u8c61\uff1a17.7% \u7684 GPU \u88ab\u5206\u914d\u53bb\u670d\u52a1\u90a3\u4e9b\u51e0\u4e4e\u6ca1\u4eba\u7528\u7684\u51b7\u95e8\u6a21\u578b\uff0c\u800c\u8fd9\u4e9b\u6a21\u578b\u53ea\u5904\u7406\u4e86\u603b\u8bf7\u6c42\u91cf\u7684 1.35%\u3002<\/p><p>\u4e4b\u524d\u8981\u540c\u65f6\u8fd0\u884c\u8fd9\u4e9b\u6a21\u578b\u65f6\uff0c\u8981\u4e48\u7ed9\u6bcf\u4e2a\u6a21\u578b\u5355\u72ec\u5206\u914d GPU\uff0c\u5f88\u591a\u51b7\u95e8\u6a21\u578b\u7684 GPU \u7ecf\u5e38\u7a7a\u7740\u6d6a\u8d39\uff0c\u8981\u4e48\u7528\u65e7\u65b9\u6cd5\u8ba9\u4e00\u4e2a GPU \u8dd1 2-3 \u4e2a\u6a21\u578b\uff08\u56e0\u4e3a GPU \u5185\u5b58\u4e0d\u591f\uff0c\u8dd1\u4e0d\u4e86\u66f4\u591a\uff09\uff0c\u603b\u4e4b\u8d44\u6e90\u5229\u7528\u7387\u7279\u522b\u4f4e\u3002<\/p><p>Aegaeon 
\u7784\u51c6\u8fd9\u4e00\u75db\u70b9\uff0c\u901a\u8fc7\u7cbe\u7ec6\u5316\u7684\u8d44\u6e90\u8c03\u5ea6\uff0c\u5f7b\u5e95\u6539\u53d8\u4e86 GPU \u8d44\u6e90\u5206\u914d\u7684\u6e38\u620f\u89c4\u5219\u3002<\/p><p>\u51b7\u95e8\u6a21\u578b\u5360\u7528\u957f\u5c3e\u8d44\u6e90<\/p><p>\u5177\u4f53\u6765\u8bf4\uff0c\u5728\u4ed6\u4eec\u7edf\u8ba1\u7684 779 \u4e2a\u6a21\u578b\u4e2d\uff0c\u6709 94.1% \u7684\u6a21\u578b\u5c5e\u4e8e\u957f\u5c3e\u6a21\u578b\uff0c\u5e73\u5747\u6bcf\u79d2\u8bf7\u6c42\u91cf\u4e0d\u5230 0.2 \u4e2a\u3002<\/p><div id=\"id_imagebox_2\" class=\"img_box \"><div class=\"content_img_div perview_img_div\"><img decoding=\"async\" id=\"img_2\" class=\"opacity_0\" src=\"https:\/\/zkres1.myzaker.com\/202510\/68f81cec8e9f09311f7a83a1_1024.jpg\" data-height=\"870\" data-width=\"1276\" \/><\/div><\/div><p>\u4e0e\u6b64\u540c\u65f6\uff0c\u90a3\u4e9b\u70ed\u95e8\u6a21\u578b\u6bd4\u5982 DeepSeek \u548c\u901a\u4e49\u5343\u95ee\u867d\u7136\u8bf7\u6c42\u91cf\u5927\uff0c\u4f46\u4e5f\u7ecf\u5e38\u51fa\u73b0\u7a81\u53d1\u6d41\u91cf\uff0c\u5bfc\u81f4\u9884\u7559\u7684 GPU \u8d44\u6e90\u65f6\u800c\u8fc7\u8f7d\u3001\u65f6\u800c\u95f2\u7f6e\u3002<\/p><p>\u5982\u679c\u6309\u7167\u7406\u60f3\u60c5\u51b5\u8ba1\u7b97\uff0c\u5355\u4e2a GPU \u6bcf\u79d2\u5e94\u8be5\u80fd\u5904\u7406\u597d\u51e0\u4e2a\u8bf7\u6c42\uff0c\u8fd9\u610f\u5473\u7740\u5f53\u524d\u7684\u8d44\u6e90\u5229\u7528\u7387\u8fd8\u6709\u8d85\u8fc7 10 \u500d\u7684\u4f18\u5316\u7a7a\u95f4\u3002<\/p><div id=\"id_imagebox_3\" class=\"img_box \"><div class=\"content_img_div perview_img_div\"><img decoding=\"async\" id=\"img_3\" class=\"opacity_0\" src=\"https:\/\/zkres1.myzaker.com\/202510\/68f81cec8e9f09311f7a83a2_1024.jpg\" data-height=\"410\" data-width=\"724\" \/><\/div><\/div><p>\u4f20\u7edf\u7684\u505a\u6cd5\u662f\u7ed9\u6bcf\u4e2a\u6a21\u578b\u5206\u914d\u4e13\u7528 GPU\uff0c\u4f46\u8fd9\u79cd &#8221; \u4e00\u5bf9\u4e00 &#8221; 
\u7684\u670d\u52a1\u6a21\u5f0f\u5728\u9762\u5bf9\u5927\u91cf\u5076\u53d1\u6027\u8bf7\u6c42\u65f6\uff0c\u7b80\u76f4\u5c31\u662f\u5728\u70e7\u94b1\u3002<\/p><p>Token \u7ea7\u522b\u8c03\u5ea6\uff0c\u8ba9 GPU&#8220; \u89c1\u7f1d\u63d2\u9488 &#8221;<\/p><p>Aegaeon \u7684\u6838\u5fc3\u521b\u65b0\u5728\u4e8e\u91c7\u7528\u4e86 token \u7ea7\u522b\u7684\u81ea\u52a8\u6269\u7f29\u5bb9\u6280\u672f\uff0c\u800c\u4e0d\u662f\u50cf\u73b0\u6709\u7cfb\u7edf\u90a3\u6837\u5728\u8bf7\u6c42\u7ea7\u522b\u8fdb\u884c\u8c03\u5ea6\u3002<\/p><p>\u5177\u4f53\u6765\u8bf4\uff0c\u7cfb\u7edf\u4f1a\u5728\u751f\u6210\u6bcf\u4e2a token \u65f6\u52a8\u6001\u51b3\u5b9a\u662f\u5426\u9700\u8981\u5207\u6362\u6a21\u578b\uff0c\u800c\u4e0d\u662f\u7b49\u5230\u6574\u4e2a\u8bf7\u6c42\u5904\u7406\u5b8c\u624d\u8003\u8651\u5207\u6362\u3002<\/p><p>\u5982\u6b64\u4e00\u6765\uff0c\u53ef\u4ee5\u8ba9 GPU \u7075\u6d3b\u5904\u7406\u591a\u4e2a\u6a21\u578b\u7684\u8bf7\u6c42\uff0c\u5927\u5927\u51cf\u5c11\u4e86\u6a21\u578b\u4e4b\u95f4\u7684\u7b49\u5f85\u65f6\u95f4\u3002\u8bba\u6587\u663e\u793a\uff0c\u901a\u8fc7\u8fd9\u79cd\u65b9\u5f0f\uff0c\u5355\u4e2a GPU \u53ef\u4ee5\u540c\u65f6\u670d\u52a1\u591a\u8fbe 7 \u4e2a\u4e0d\u540c\u7684\u6a21\u578b\u3002<\/p><div id=\"id_imagebox_4\" class=\"img_box \"><div class=\"content_img_div perview_img_div\"><img decoding=\"async\" id=\"img_4\" class=\"opacity_0\" src=\"https:\/\/zkres1.myzaker.com\/202510\/68f81cec8e9f09311f7a83a3_1024.jpg\" data-height=\"866\" data-width=\"656\" \/><\/div><\/div><p>\u4e3a\u4e86\u5b9e\u73b0\u8fd9\u4e2a\u76ee\u6807\uff0c\u7814\u7a76\u56e2\u961f\u8fd8\u8fdb\u884c\u4e86\u4e00\u7cfb\u5217\u5e95\u5c42\u4f18\u5316\uff1a<\/p><p>\u901a\u8fc7\u7ec4\u4ef6\u590d\u7528\u51cf\u5c11\u4e86 80% \u7684\u521d\u59cb\u5316\u5f00\u9500\uff1b<\/p><p>\u91c7\u7528\u663e\u5f0f\u5185\u5b58\u7ba1\u7406\u907f\u514d\u4e86\u5185\u5b58\u788e\u7247\uff1b<\/p><p>\u5b9e\u73b0\u4e86\u7ec6\u7c92\u5ea6\u7684 KV 
\u7f13\u5b58\u540c\u6b65\u673a\u5236\uff0c\u8ba9\u6a21\u578b\u5207\u6362\u65f6\u95f4\u4ece\u51e0\u5341\u79d2\u7f29\u77ed\u5230 1 \u79d2\u4ee5\u5185\u3002<\/p><p>\u6574\u4f53\u6765\u770b\uff0c\u8fd9\u4e9b\u4f18\u5316\u5c06\u81ea\u52a8\u6269\u7f29\u5bb9\u7684\u5f00\u9500\u964d\u4f4e\u4e86 97%\u3002<\/p><div id=\"id_imagebox_5\" class=\"img_box \"><div class=\"content_img_div perview_img_div\"><img decoding=\"async\" id=\"img_5\" class=\"opacity_0\" src=\"https:\/\/zkres1.myzaker.com\/202510\/68f81cec8e9f09311f7a83a4_1024.jpg\" data-height=\"732\" data-width=\"982\" \/><\/div><\/div><p>\u5b9e\u6218\u6548\u679c\uff1a\u541e\u5410\u91cf\u63d0\u5347 9 \u500d<\/p><p>Aegaeon \u5c55\u73b0\u51fa\u6700\u9ad8\u53ef\u8fbe 9 \u500d\u7684\u6027\u80fd\u63d0\u5347\uff0c\u6700\u4f4e\u4e5f\u6709 1.5 \u500d\uff0c\u8ba1\u7b97\u8d44\u6e90\u5f97\u5230\u4e86\u6781\u5927\u7684\u4f18\u5316\u3002<\/p><p>\u6839\u636e\u8bba\u6587\u6570\u636e\uff0c\u4e0e\u73b0\u6709\u7684 ServerlessLLM \u548c MuxServe \u7b49\u7cfb\u7edf\u76f8\u6bd4\uff0cAegaeon \u80fd\u591f\u652f\u6491 2-2.5 \u500d\u7684\u8bf7\u6c42\u5230\u8fbe\u7387\uff0c\u6709\u6548\u541e\u5410\u91cf\uff08goodput\uff09\u63d0\u5347\u4e86 1.5 \u5230 9 \u500d\u3002\u5728\u6d4b\u8bd5\u73af\u5883\u4e2d\uff0c\u4f7f\u7528 16 \u5757 H800 GPU \u7684\u96c6\u7fa4\uff0c\u7cfb\u7edf\u6210\u529f\u670d\u52a1\u4e86\u4ece 6B \u5230 72B \u53c2\u6570\u89c4\u6a21\u7684\u591a\u4e2a\u6a21\u578b\u3002<\/p><div id=\"id_imagebox_6\" class=\"img_box \"><div class=\"content_img_div perview_img_div\"><img decoding=\"async\" id=\"img_6\" class=\"opacity_0\" src=\"https:\/\/zkres1.myzaker.com\/202510\/68f81cec8e9f09311f7a83a5_1024.jpg\" data-height=\"680\" data-width=\"1342\" \/><\/div><\/div><p>\u66f4\u91cd\u8981\u7684\u662f\uff0c\u8fd9\u5957\u7cfb\u7edf\u5df2\u7ecf\u5728\u963f\u91cc\u4e91\u767e\u70bc\u5e73\u53f0\u8fdb\u884c\u4e86\u8d85\u8fc7 3 
\u4e2a\u6708\u7684\u751f\u4ea7\u73af\u5883\u6d4b\u8bd5\u3002<\/p><p>\u5728\u5b9e\u9645\u90e8\u7f72\u4e2d\uff0c\u5b83\u670d\u52a1\u4e86 47 \u4e2a\u4e0d\u540c\u89c4\u6a21\u7684\u6a21\u578b\uff0c\u5305\u62ec 28 \u4e2a 1.8B-7B \u7684\u5c0f\u6a21\u578b\u548c 19 \u4e2a 32B-72B \u7684\u5927\u6a21\u578b\u3002GPU \u5229\u7528\u7387\u4ece\u4e4b\u524d\u7684 13.3%-33.9% \u63d0\u5347\u5230\u4e86 48.1%\uff0c\u671f\u95f4\u6ca1\u6709\u51fa\u73b0\u4efb\u4f55 SLO \u8fdd\u89c4\u6216\u670d\u52a1\u4e2d\u65ad\u3002<\/p><div id=\"id_imagebox_7\" class=\"img_box \"><div class=\"content_img_div perview_img_div\"><img decoding=\"async\" id=\"img_7\" class=\"opacity_0\" src=\"https:\/\/zkres1.myzaker.com\/202510\/68f81cec8e9f09311f7a83a6_1024.jpg\" data-height=\"484\" data-width=\"680\" \/><\/div><\/div>\t\t\t\t\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t","protected":false},"excerpt":{"rendered":"<p>\u68a6\u6668 \u53d1\u81ea \u51f9\u975e\u5bfa<\/p>\n","protected":false},"author":1,"featured_media":4455,"comment_status":"closed","ping_status":"closed","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[1],"tags":[],"class_list":["post-4453","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-uncategorized"],"aioseo_notices":[],"_links":{"self":[{"href":"https:\/\/www.ihub1.com\/index.php\/wp-json\/wp\/v2\/posts\/4453","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.ihub1.com\/index.php\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.ihub1.com\/index.php\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.ihub1.com\/index.php\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/www.ihub1.com\/index.php\/wp-json\/wp\/v2\/comments?post=4453"}],"version-history":[{"count":7,"href":"https:\/\/www.ihub1.com\/index.php\/wp-json\/wp\/v2\/posts\/4453\/revisions"}],"predecessor-version":[{"i
d":4461,"href":"https:\/\/www.ihub1.com\/index.php\/wp-json\/wp\/v2\/posts\/4453\/revisions\/4461"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/www.ihub1.com\/index.php\/wp-json\/wp\/v2\/media\/4455"}],"wp:attachment":[{"href":"https:\/\/www.ihub1.com\/index.php\/wp-json\/wp\/v2\/media?parent=4453"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.ihub1.com\/index.php\/wp-json\/wp\/v2\/categories?post=4453"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.ihub1.com\/index.php\/wp-json\/wp\/v2\/tags?post=4453"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}