{"id":108,"date":"2026-04-23T23:08:18","date_gmt":"2026-04-23T15:08:18","guid":{"rendered":"https:\/\/blog.nickys.cn\/?p=108"},"modified":"2026-04-24T22:40:43","modified_gmt":"2026-04-24T14:40:43","slug":"deepseek-v3%ef%bc%9a671b%e5%8f%82%e6%95%b0%e7%9a%84moe%e5%a4%a7%e6%a8%a1%e5%9e%8b%ef%bc%8c%e8%ae%ad%e7%bb%83%e6%88%90%e6%9c%ac%e4%bb%85557%e4%b8%87%e7%be%8e%e5%85%83","status":"publish","type":"post","link":"https:\/\/blog.nickys.cn\/?p=108","title":{"rendered":"DeepSeek-V3\uff1a671B\u53c2\u6570\uff0c\u8bad\u7ec3\u6210\u672c557\u4e07\u7f8e\u5143\uff0c\u51ed\u4ec0\u4e48\uff1f"},"content":{"rendered":"<style>\n.gpu-hero { background: linear-gradient(135deg, #0c0a1a 0%, #1a1145 50%, #0c0a1a 100%); padding: 48px 32px; text-align: center; border-radius: 16px; margin-bottom: 32px; }\n.gpu-hero h2 { color: #fff; font-size: 28px; margin: 0 0 12px; font-weight: 700; }\n.gpu-hero p { color: #94a3b8; font-size: 16px; margin: 0; line-height: 1.7; }\n.gpu-hero .badge { display: inline-block; background: linear-gradient(135deg, #a855f7, #7c3aed); color: #fff; padding: 4px 16px; border-radius: 20px; font-size: 13px; font-weight: 600; margin-bottom: 16px; }\n.gpu-stats { display: flex; justify-content: center; gap: 32px; margin-top: 24px; flex-wrap: wrap; }\n.gpu-stats .stat { text-align: center; }\n.gpu-stats .stat .num { font-size: 28px; font-weight: 800; color: #a855f7; }\n.gpu-stats .stat .label { font-size: 12px; color: #64748b; margin-top: 4px; }\n.gpu-table-wrap { border-radius: 12px; overflow: hidden; box-shadow: 0 4px 24px rgba(0,0,0,0.06); margin: 24px 0; }\n.gpu-table { width: 100%; border-collapse: collapse; font-size: 14px; }\n.gpu-table thead th { background: linear-gradient(135deg, #1a1145, #2d1b69); color: #fff; padding: 12px 10px; font-weight: 600; font-size: 13px; white-space: nowrap; }\n.gpu-table tbody td { padding: 10px; border-bottom: 1px solid #f1f5f9; text-align: center; }\n.gpu-table tbody td:first-child { text-align: left; font-weight: 600; }\n.gpu-table 
tbody tr:nth-child(even) { background: #f8fafc; }\n.gpu-table tbody tr:hover { background: #faf5ff; }\n.gpu-table .best { background: #f0fdf4 !important; }\n.gpu-table .best td { border-left: 3px solid #22c55e; }\n.gpu-table .winner { color: #16a34a; font-weight: 700; }\n.finding-card { border-radius: 12px; padding: 24px; margin: 16px 0; border-left: 4px solid; box-shadow: 0 2px 12px rgba(0,0,0,0.04); }\n.finding-card h4 { margin: 0 0 8px; font-size: 17px; font-weight: 700; }\n.finding-card p { margin: 0; color: #475569; line-height: 1.8; font-size: 15px; }\n.fc-red { background: #fef2f2; border-color: #ef4444; }\n.fc-red h4 { color: #dc2626; }\n.fc-green { background: #f0fdf4; border-color: #22c55e; }\n.fc-green h4 { color: #16a34a; }\n.fc-blue { background: #eff6ff; border-color: #3b82f6; }\n.fc-blue h4 { color: #2563eb; }\n.fc-orange { background: #fff7ed; border-color: #f97316; }\n.fc-orange h4 { color: #ea580c; }\n.fc-purple { background: #faf5ff; border-color: #a855f7; }\n.fc-purple h4 { color: #9333ea; }\n.fc-teal { background: #f0fdfa; border-color: #14b8a6; }\n.fc-teal h4 { color: #0d9488; }\n.tech-card { border-radius: 12px; padding: 20px 24px; margin: 12px 0; background: linear-gradient(135deg, #faf5ff, #f3e8ff); border-left: 4px solid #a855f7; }\n.tech-card h4 { margin: 0 0 8px; font-size: 16px; font-weight: 700; color: #7c3aed; }\n.tech-card p { margin: 0; color: #475569; line-height: 1.8; font-size: 15px; }\n.fw-card { border-radius: 12px; padding: 16px 20px; margin: 8px 0; display: flex; align-items: center; gap: 12px; background: #f8fafc; border: 1px solid #e2e8f0; }\n.fw-card .fw-name { background: #fff; border-radius: 8px; padding: 8px 14px; font-weight: 700; font-size: 14px; color: #7c3aed; box-shadow: 0 1px 4px rgba(0,0,0,0.08); min-width: 120px; text-align: center; }\n.fw-card .fw-desc { flex: 1; font-size: 14px; color: #475569; line-height: 1.6; }\n.summary-box { background: linear-gradient(135deg, #1a1145, #0c0a1a); border-radius: 16px; 
padding: 28px 32px; color: #e2e8f0; line-height: 1.9; font-size: 15px; margin: 24px 0; }\n.summary-box strong { color: #a855f7; }\n.note-box { background: #fffbeb; border: 1px solid #fde68a; border-radius: 12px; padding: 20px 24px; margin: 24px 0; }\n.note-box ul { margin: 8px 0 0 0; padding-left: 20px; color: #92400e; }\n.note-box li { margin: 6px 0; line-height: 1.7; }\n.link-row { display: flex; gap: 12px; flex-wrap: wrap; justify-content: center; margin: 16px 0; }\n.link-row a { display: inline-block; padding: 10px 24px; border-radius: 8px; background: linear-gradient(135deg, #7c3aed, #a855f7); color: #fff; text-decoration: none; font-weight: 600; font-size: 14px; transition: opacity 0.2s; }\n.link-row a:hover { opacity: 0.85; }\n@media (max-width: 640px) {\n.gpu-stats { gap: 16px; }\n.gpu-table { font-size: 12px; }\n.gpu-table thead th, .gpu-table tbody td { padding: 8px 6px; }\n.fw-card { flex-direction: column; align-items: flex-start; }\n.fw-card .fw-name { min-width: auto; }\n.link-row { flex-direction: column; align-items: center; }\n}\n<\/style>\n<div class=\"gpu-hero\">\n<div class=\"badge\">DeepSeek-V3 \u6280\u672f\u89e3\u8bfb<\/div>\n<h2>671B \u53c2\u6570\uff0c557 \u4e07\u7f8e\u5143\u8bad\u7ec3\u6210\u672c<\/h2>\n<p>MoE \u67b6\u6784 | FP8 \u6df7\u5408\u7cbe\u5ea6 | 14.8T token \u9884\u8bad\u7ec3 | 128K \u4e0a\u4e0b\u6587<br \/>\u8dd1\u5206\u538b\u7740 GPT-4o \u6253\uff0c\u8bad\u7ec3\u6210\u672c\u4e0d\u5230 LLaMA 3.1 \u7684\u4e94\u5206\u4e4b\u4e00<\/p>\n<div class=\"gpu-stats\">\n<div class=\"stat\">\n<div class=\"num\">671B<\/div>\n<div class=\"label\">\u603b\u53c2\u6570<\/div>\n<\/div>\n<div class=\"stat\">\n<div class=\"num\">37B<\/div>\n<div class=\"label\">\u6fc0\u6d3b\u53c2\u6570<\/div>\n<\/div>\n<div class=\"stat\">\n<div class=\"num\">$557\u4e07<\/div>\n<div class=\"label\">\u8bad\u7ec3\u6210\u672c<\/div>\n<\/div>\n<div class=\"stat\">\n<div class=\"num\">128K<\/div>\n<div 
class=\"label\">\u4e0a\u4e0b\u6587\u7a97\u53e3<\/div>\n<\/div>\n<\/div>\n<\/div>\n<h2 style=\"text-align:center; font-size:20px; color:#334155; margin-bottom:4px;\">\u67b6\u6784\u521b\u65b0<\/h2>\n<p style=\"text-align:center; color:#94a3b8; font-size:13px; margin-bottom:20px;\">\u4e09\u9879\u5173\u952e\u6280\u672f\uff0c\u89e3\u51b3 MoE \u8001\u95ee\u9898 + \u63a8\u7406\u6548\u7387 + \u8bad\u7ec3\u7a33\u5b9a\u6027<\/p>\n<div class=\"tech-card\">\n<h4>\u65e0\u8f85\u52a9\u635f\u5931\u7684\u8d1f\u8f7d\u5747\u8861<\/h4>\n<p>MoE \u6a21\u578b\u7684\u8001\u5927\u96be\u95ee\u9898\uff1a\u5404\u4e13\u5bb6\u8d1f\u8f7d\u4e0d\u5747\u8861\u3002\u4f20\u7edf\u505a\u6cd5\u662f\u52a0\u8f85\u52a9\u635f\u5931\u51fd\u6570\u5f3a\u5236\u5e73\u8861\uff0c\u4f46\u4f1a\u62d6\u7d2f\u6a21\u578b\u6027\u80fd\u3002DeepSeek-V3 \u76f4\u63a5\u53bb\u6389\u8f85\u52a9\u635f\u5931\uff0c\u7528\u65b0\u65b9\u6848\u5b9e\u73b0\u8d1f\u8f7d\u5747\u8861\uff0c\u6027\u80fd\u4e0d\u53d7\u5f71\u54cd\u3002<\/p>\n<\/div>\n<div class=\"tech-card\">\n<h4>\u591a token \u9884\u6d4b\uff08MTP\uff09<\/h4>\n<p>\u4e00\u822c\u6a21\u578b\u4e00\u6b21\u53ea\u9884\u6d4b\u4e0b\u4e00\u4e2a token\uff0cDeepSeek-V3 \u4e00\u6b21\u9884\u6d4b\u591a\u4e2a\u3002\u8bad\u7ec3\u65f6\u5b66\u5f97\u66f4\u6df1\uff0c\u63a8\u7406\u65f6\u53ef\u4ee5\u505a\u6295\u673a\u89e3\u7801\u52a0\u901f\u3002\u8bba\u6587\u9a8c\u8bc1\u4e86 MTP \u786e\u5b9e\u80fd\u63d0\u5347\u6548\u679c\u3002<\/p>\n<\/div>\n<div class=\"tech-card\">\n<h4>MLA + DeepSeekMoE\uff08\u7ee7\u627f V2\uff09<\/h4>\n<p>\u591a\u5934\u6f5c\u5728\u6ce8\u610f\u529b\uff08MLA\uff09\u538b\u7f29 KV \u7f13\u5b58\uff0c\u964d\u4f4e\u663e\u5b58\u5360\u7528\uff1bDeepSeekMoE \u7528\u7ec6\u7c92\u5ea6\u4e13\u5bb6+\u5171\u4eab\u4e13\u5bb6\u7ec4\u5408\uff0c\u6a21\u578b\u5bb9\u91cf\u5927\u4f46\u63a8\u7406\u4fbf\u5b9c\u3002V2 \u9a8c\u8bc1\u8fc7\u7684\u4e1c\u897f\u4e0d\u6298\u817e\uff0c\u76f4\u63a5\u7ee7\u627f\u3002<\/p>\n<\/div>\n<h2 style=\"text-align:center; font-size:20px; color:#334155; margin-top:32px; 
margin-bottom:4px;\">\u8bad\u7ec3\u6548\u7387<\/h2>\n<p style=\"text-align:center; color:#94a3b8; font-size:13px; margin-bottom:20px;\">\u7b2c\u4e00\u4e2a\u5728\u8d85\u5927\u89c4\u6a21\u6a21\u578b\u4e0a\u8dd1\u901a FP8 \u8bad\u7ec3\u7684\u56e2\u961f<\/p>\n<div class=\"finding-card fc-purple\">\n<h4>FP8 \u6df7\u5408\u7cbe\u5ea6\u8bad\u7ec3<\/h4>\n<p>\u4ee5\u524d\u5927\u5bb6\u89c9\u5f97 FP8 \u7cbe\u5ea6\u4e0d\u591f\u4e0d\u6562\u7528\uff0cDeepSeek-V3 \u7b2c\u4e00\u4e2a\u5728\u8d85\u5927\u89c4\u6a21\u4e0a\u8dd1\u901a\u4e86 FP8\uff0c\u6548\u679c\u6ca1\u95ee\u9898\u3002\u8fd9\u662f\u5b9e\u6253\u5b9e\u7684\u6280\u672f\u7a81\u7834\uff0c\u4ee5\u540e\u522b\u4eba\u4e5f\u80fd\u7528\u3002<\/p>\n<\/div>\n<div class=\"finding-card fc-blue\">\n<h4>\u8ba1\u7b97\u901a\u4fe1\u91cd\u53e0<\/h4>\n<p>MoE \u8bad\u7ec3\u74f6\u9888\u5728\u8de8\u8282\u70b9\u901a\u4fe1\u3002\u56e2\u961f\u4ece\u7b97\u6cd5\u3001\u6846\u67b6\u3001\u786c\u4ef6\u4e09\u5c42\u534f\u540c\u8bbe\u8ba1\uff0c\u51e0\u4e4e\u505a\u5230\u8ba1\u7b97\u548c\u901a\u4fe1\u5b8c\u5168\u91cd\u53e0\u2014\u2014\u901a\u4fe1\u4e0d\u518d\u62d6\u540e\u817f\u3002<\/p>\n<\/div>\n<div style=\"display:flex; justify-content:center; gap:24px; margin:24px 0; flex-wrap:wrap;\">\n<div style=\"text-align:center; background:#faf5ff; border-radius:12px; padding:20px 28px;\">\n<div style=\"font-size:24px; font-weight:800; color:#7c3aed;\">266.4\u4e07<\/div>\n<div style=\"font-size:12px; color:#64748b; margin-top:4px;\">H800 GPU\u5c0f\u65f6\uff08\u9884\u8bad\u7ec3\uff09<\/div>\n<\/div>\n<div style=\"text-align:center; background:#faf5ff; border-radius:12px; padding:20px 28px;\">\n<div style=\"font-size:24px; font-weight:800; color:#7c3aed;\">10\u4e07<\/div>\n<div style=\"font-size:12px; color:#64748b; margin-top:4px;\">GPU\u5c0f\u65f6\uff08\u540e\u8bad\u7ec3\uff09<\/div>\n<\/div>\n<div style=\"text-align:center; background:#faf5ff; border-radius:12px; padding:20px 28px;\">\n<div style=\"font-size:24px; font-weight:800; 
color:#7c3aed;\">$557\u4e07<\/div>\n<div style=\"font-size:12px; color:#64748b; margin-top:4px;\">\u603b\u6210\u672c<\/div>\n<\/div>\n<\/div>\n<p style=\"text-align:center; color:#64748b; font-size:14px; margin:0 0 24px;\">\u5bf9\u6bd4\uff1aMeta \u8bad\u7ec3 LLaMA 3.1 405B \u7528\u4e86\u7ea6 3000 \u4e07 GPU \u5c0f\u65f6\uff0cDeepSeek-V3 \u53c2\u6570\u66f4\u591a\uff0c\u6210\u672c\u4e0d\u5230\u4e94\u5206\u4e4b\u4e00<\/p>\n<div class=\"finding-card fc-teal\">\n<h4>\u4ece R1 \u84b8\u998f\u63a8\u7406\u80fd\u529b<\/h4>\n<p>DeepSeek-R1 \u662f\u4e13\u6ce8\u63a8\u7406\u7684\u957f\u94fe\u601d\u7ef4\u6a21\u578b\uff0c\u4f46\u8f93\u51fa\u5197\u957f\u3001\u98ce\u683c\u4e0d\u597d\u63a7\u5236\u3002V3 \u628a R1 \u7684\u9a8c\u8bc1\u548c\u53cd\u601d\u6a21\u5f0f\u84b8\u998f\u8fc7\u6765\uff0c\u4fdd\u7559\u63a8\u7406\u80fd\u529b\uff0c\u540c\u65f6\u63a7\u5236\u8f93\u51fa\u98ce\u683c\u548c\u957f\u5ea6\u3002\u76f8\u5f53\u4e8e\u628a\u7231\u5199\u957f\u7bc7\u5927\u8bba\u7684\u5b66\u9738\uff0c\u8c03\u6559\u6210\u7b54\u9898\u7cbe\u70bc\u7684\u8003\u8bd5\u9009\u624b\u3002<\/p>\n<\/div>\n<h2 style=\"text-align:center; font-size:20px; color:#334155; margin-top:32px; margin-bottom:4px;\">\u8dd1\u5206\u6210\u7ee9<\/h2>\n<p style=\"text-align:center; color:#94a3b8; font-size:13px; margin-bottom:20px;\">\u7eff\u8272\u6807\u6ce8 = \u8be5\u9879\u6700\u4f18 \/ \u6570\u636e\u5747\u4e3a\u767e\u5206\u5236\u5f97\u5206<\/p>\n<h3 style=\"text-align:center; color:#475569; font-size:16px; margin:20px 0 8px;\">\u7efc\u5408\u80fd\u529b vs \u5f00\u6e90\u6a21\u578b<\/h3>\n<div class=\"gpu-table-wrap\">\n<table class=\"gpu-table\">\n<thead>\n<tr>\n<th>\u8bc4\u6d4b<\/th>\n<th>Qwen2.5 72B<\/th>\n<th>LLaMA3.1 405B<\/th>\n<th>DeepSeek-V3<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr class=\"best\">\n<td>MMLU<\/td>\n<td>85.0<\/td>\n<td>84.4<\/td>\n<td class=\"winner\">87.1<\/td>\n<\/tr>\n<tr class=\"best\">\n<td>MMLU-Pro<\/td>\n<td>58.3<\/td>\n<td>52.8<\/td>\n<td class=\"winner\">64.4<\/td>\n<\/tr>\n<tr 
class=\"best\">\n<td>BBH<\/td>\n<td>79.8<\/td>\n<td>82.9<\/td>\n<td class=\"winner\">87.5<\/td>\n<\/tr>\n<tr class=\"best\">\n<td>DROP<\/td>\n<td>80.6<\/td>\n<td>86.0<\/td>\n<td class=\"winner\">89.0<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<\/div>\n<h3 style=\"text-align:center; color:#475569; font-size:16px; margin:20px 0 8px;\">\u6570\u5b66\u548c\u4ee3\u7801\u80fd\u529b vs \u5f00\u6e90\u6a21\u578b<\/h3>\n<div class=\"gpu-table-wrap\">\n<table class=\"gpu-table\">\n<thead>\n<tr>\n<th>\u8bc4\u6d4b<\/th>\n<th>Qwen2.5 72B<\/th>\n<th>LLaMA3.1 405B<\/th>\n<th>DeepSeek-V3<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr class=\"best\">\n<td>MATH<\/td>\n<td>54.4<\/td>\n<td>49.0<\/td>\n<td class=\"winner\">61.6<\/td>\n<\/tr>\n<tr class=\"best\">\n<td>GSM8K<\/td>\n<td>88.3<\/td>\n<td>83.5<\/td>\n<td class=\"winner\">89.3<\/td>\n<\/tr>\n<tr class=\"best\">\n<td>HumanEval<\/td>\n<td>53.0<\/td>\n<td>54.9<\/td>\n<td class=\"winner\">65.2<\/td>\n<\/tr>\n<tr class=\"best\">\n<td>LiveCodeBench<\/td>\n<td>12.9<\/td>\n<td>15.5<\/td>\n<td class=\"winner\">19.4<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<\/div>\n<h3 style=\"text-align:center; color:#475569; font-size:16px; margin:20px 0 8px;\">vs \u95ed\u6e90\u6a21\u578b<\/h3>\n<div class=\"gpu-table-wrap\">\n<table class=\"gpu-table\">\n<thead>\n<tr>\n<th>\u8bc4\u6d4b<\/th>\n<th>Claude-3.5-Sonnet<\/th>\n<th>GPT-4o<\/th>\n<th>DeepSeek-V3<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr class=\"best\">\n<td>MMLU<\/td>\n<td>88.3<\/td>\n<td>87.2<\/td>\n<td class=\"winner\">88.5<\/td>\n<\/tr>\n<tr class=\"best\">\n<td>MATH-500<\/td>\n<td>78.3<\/td>\n<td>74.6<\/td>\n<td class=\"winner\">90.2<\/td>\n<\/tr>\n<tr class=\"best\">\n<td>AIME 2024<\/td>\n<td>16.0<\/td>\n<td>9.3<\/td>\n<td class=\"winner\">39.2<\/td>\n<\/tr>\n<tr class=\"best\">\n<td>LiveCodeBench<\/td>\n<td>36.3<\/td>\n<td>33.4<\/td>\n<td class=\"winner\">40.5<\/td>\n<\/tr>\n<tr class=\"best\">\n<td>Codeforces<\/td>\n<td>20.3<\/td>\n<td>23.6<\/td>\n<td 
class=\"winner\">51.6<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<\/div>\n<h3 style=\"text-align:center; color:#475569; font-size:16px; margin:20px 0 8px;\">\u5f00\u653e\u5f0f\u5bf9\u8bdd\u8bc4\u6d4b<\/h3>\n<div class=\"gpu-table-wrap\">\n<table class=\"gpu-table\">\n<thead>\n<tr>\n<th>\u6a21\u578b<\/th>\n<th>Arena-Hard<\/th>\n<th>AlpacaEval 2.0<\/th>\n<\/tr>\n<\/thead>\n<tbody>\n<tr>\n<td>GPT-4o<\/td>\n<td>80.4<\/td>\n<td>51.1<\/td>\n<\/tr>\n<tr>\n<td>Claude-3.5-Sonnet<\/td>\n<td>85.2<\/td>\n<td>52.0<\/td>\n<\/tr>\n<tr class=\"best\">\n<td>DeepSeek-V3<\/td>\n<td class=\"winner\">85.5<\/td>\n<td class=\"winner\">70.0<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<\/div>\n<h2 style=\"text-align:center; font-size:20px; color:#334155; margin-top:32px; margin-bottom:4px;\">\u56db\u4e2a\u5173\u952e\u53d1\u73b0<\/h2>\n<div class=\"finding-card fc-red\">\n<h4>1. AIME 2024 \u7ade\u8d5b\u6570\u5b66\u78be\u538b<\/h4>\n<p>DeepSeek-V3 \u5f97\u5206 39.2\uff0cClaude-3.5-Sonnet \u53ea\u6709 16.0\uff0cGPT-4o \u53ea\u6709 9.3\u3002\u5dee\u8ddd\u4e0d\u662f\u4e00\u70b9\u534a\u70b9\uff0c\u662f\u6570\u91cf\u7ea7\u7684\u3002Codeforces \u7f16\u7a0b\u7ade\u8d5b 51.6 \u767e\u5206\u4f4d\uff0c\u5176\u4ed6\u4e24\u4e2a\u8fde 25 \u90fd\u5230\u4e0d\u4e86\u3002<\/p>\n<\/div>\n<div class=\"finding-card fc-green\">\n<h4>2. AlpacaEval 2.0 \u80dc\u7387 70.0<\/h4>\n<p>\u6bd4 GPT-4o\uff0851.1\uff09\u548c Claude-3.5-Sonnet\uff0852.0\uff09\u9ad8\u51fa\u5c06\u8fd1 20 \u4e2a\u70b9\u3002\u5728\u5f00\u653e\u5f0f\u5bf9\u8bdd\u8bc4\u6d4b\u4e2d\uff0cDeepSeek-V3 \u7684\u56de\u7b54\u8d28\u91cf\u660e\u663e\u66f4\u53d7\u504f\u597d\u3002<\/p>\n<\/div>\n<div class=\"finding-card fc-orange\">\n<h4>3. 
\u8bad\u7ec3\u6210\u672c\u4e0d\u5230 LLaMA 3.1 \u7684 1\/5<\/h4>\n<p>Meta \u8bad\u7ec3 LLaMA 3.1 405B \u7528\u4e86\u7ea6 3000 \u4e07 GPU \u5c0f\u65f6\uff0cDeepSeek-V3 \u53c2\u6570\u66f4\u591a\uff08671B vs 405B\uff09\uff0c\u53ea\u7528\u4e86 278.8 \u4e07 GPU \u5c0f\u65f6\u3002FP8 + \u8ba1\u7b97\u901a\u4fe1\u91cd\u53e0\uff0c\u6548\u7387\u63d0\u5347\u5de8\u5927\u3002<\/p>\n<\/div>\n<div class=\"finding-card fc-purple\">\n<h4>4. \u4e8b\u5b9e\u6027\u95ee\u7b54\u8fd8\u6709\u77ed\u677f<\/h4>\n<p>SimpleQA \u7b49\u4e8b\u5b9e\u6027\u95ee\u7b54\u4e0a\u8fd8\u843d\u540e\u4e8e GPT-4o\uff0c\u8bf4\u660e\u77e5\u8bc6\u51c6\u786e\u6027\u8fd8\u6709\u63d0\u5347\u7a7a\u95f4\u3002\u4f46\u7efc\u5408\u6765\u770b\uff0c\u76ee\u524d\u6700\u5f3a\u5f00\u6e90\u5927\u6a21\u578b\u6ca1\u6709\u4e4b\u4e00\u3002<\/p>\n<\/div>\n<h2 style=\"text-align:center; font-size:20px; color:#334155; margin-top:32px; margin-bottom:4px;\">\u63a8\u7406\u6846\u67b6\u652f\u6301<\/h2>\n<p style=\"text-align:center; color:#94a3b8; font-size:13px; margin-bottom:16px;\">\u5b98\u65b9\u53ea\u63d0\u4f9b FP8 \u6743\u91cd\uff0c\u9700\u8981 BF16 \u53ef\u7528\u811a\u672c\u8f6c\u6362 \/ \u4ec5\u652f\u6301 Linux + Python 3.10<\/p>\n<div class=\"fw-card\">\n<div class=\"fw-name\">SGLang<\/div>\n<div class=\"fw-desc\">BF16\/FP8 \u63a8\u7406\uff0cMLA \u4f18\u5316\uff0cFP8 KV Cache\uff0cNVIDIA \u548c AMD GPU \u90fd\u652f\u6301<\/div>\n<\/div>\n<div class=\"fw-card\">\n<div class=\"fw-name\">vLLM<\/div>\n<div class=\"fw-desc\">FP8\/BF16\uff0c\u5f20\u91cf\u5e76\u884c+\u6d41\u6c34\u7ebf\u5e76\u884c\uff0c\u591a\u673a\u90e8\u7f72<\/div>\n<\/div>\n<div class=\"fw-card\">\n<div class=\"fw-name\">LMDeploy<\/div>\n<div class=\"fw-desc\">FP8\/BF16 \u63a8\u7406\uff0c\u672c\u5730\u548c\u4e91\u7aef\u90fd\u80fd\u8dd1<\/div>\n<\/div>\n<div class=\"fw-card\">\n<div class=\"fw-name\">TensorRT-LLM<\/div>\n<div class=\"fw-desc\">BF16 \u63a8\u7406\uff0cINT4\/8 \u91cf\u5316\uff0cFP8 \u8fd8\u5728\u5f00\u53d1\u4e2d<\/div>\n<\/div>\n<div 
class=\"fw-card\">\n<div class=\"fw-name\">LightLLM<\/div>\n<div class=\"fw-desc\">\u5355\u673a\/\u591a\u673a\u5f20\u91cf\u5e76\u884c<\/div>\n<\/div>\n<div class=\"fw-card\">\n<div class=\"fw-name\">\u534e\u4e3a\u6607\u817e NPU<\/div>\n<div class=\"fw-desc\">\u901a\u8fc7 MindIE \u6846\u67b6\uff0cINT8 \u548c BF16<\/div>\n<\/div>\n<div class=\"link-row\">\n<a href=\"https:\/\/chat.deepseek.com\/\">\u5728\u7ebf\u804a\u5929<\/a><br \/>\n<a href=\"https:\/\/platform.deepseek.com\/\">API \u63a5\u53e3<\/a><br \/>\n<a href=\"https:\/\/huggingface.co\/deepseek-ai\/DeepSeek-V3-Base\">Base \u6a21\u578b<\/a><br \/>\n<a href=\"https:\/\/huggingface.co\/deepseek-ai\/DeepSeek-V3\">Chat \u6a21\u578b<\/a><br \/>\n<a href=\"https:\/\/arxiv.org\/abs\/2412.19437\">\u8bba\u6587\u539f\u6587<\/a>\n<\/div>\n<div class=\"note-box\">\n<strong style=\"color:#92400e;\">\u8bb8\u53ef\u8bc1<\/strong>\n<ul>\n<li>\u4ee3\u7801\uff1aMIT \u8bb8\u53ef\u8bc1<\/li>\n<li>\u6a21\u578b\uff1a\u81ea\u6709\u8bb8\u53ef\u8bc1\uff0c\u652f\u6301\u5546\u4e1a\u4f7f\u7528<\/li>\n<li>\u6a21\u578b\u603b\u5927\u5c0f 685B\uff08671B \u4e3b\u6a21\u578b\u6743\u91cd + 14B \u591a token \u9884\u6d4b\u6a21\u5757\u6743\u91cd\uff09<\/li>\n<\/ul>\n<\/div>\n<div class=\"summary-box\">\n<strong>\u4e00\u53e5\u8bdd\u603b\u7ed3\uff1a<\/strong>DeepSeek-V3 \u6700\u8ba9\u4eba\u610f\u5916\u7684\u4e0d\u662f\u8dd1\u5206\uff0c\u800c\u662f\u8bad\u7ec3\u6210\u672c\u3002557 \u4e07\u7f8e\u5143\u8bad\u7ec3\u4e00\u4e2a 671B \u7684\u6a21\u578b\uff0c\u8dd1\u5206\u538b\u7740 GPT-4o \u6253\uff0c\u8fd9\u5728\u4e00\u5e74\u524d\u6839\u672c\u4e0d\u6562\u60f3\u3002\u65e0\u8f85\u52a9\u635f\u5931\u8d1f\u8f7d\u5747\u8861\u89e3\u51b3\u4e86 MoE \u8001\u5927\u96be\u95ee\u9898\uff0cFP8 \u8bad\u7ec3\u8dd1\u901a\u8d85\u5927\u6a21\u578b\uff0c\u4ece R1 \u84b8\u998f\u63a8\u7406\u80fd\u529b\u601d\u8def\u5de7\u5999\uff0c\u8bad\u7ec3\u5168\u7a0b\u96f6\u4e8b\u6545\u2014\u2014\u5de5\u7a0b\u80fd\u529b\u786e\u5b9e\u786c\u3002\n<p><em 
style=\"color:#64748b;\">\u8bba\u6587\u5730\u5740\uff1aarxiv.org\/abs\/2412.19437 | \u6a21\u578b\u6743\u91cd\uff1aHuggingFace deepseek-ai | \u6570\u636e\u6765\u6e90\uff1aDeepSeek-V3 \u6280\u672f\u8bba\u6587<\/em>\n<\/p>\n<\/div>\n","protected":false},"excerpt":{"rendered":"<p>DeepSeek-V3 \u6280\u672f\u89e3\u8bfb 671B \u53c2\u6570\uff0c557 \u4e07\u7f8e\u5143\u8bad\u7ec3\u6210\u672c MoE \u67b6\u6784 | FP8 \u6df7\u5408\u7cbe\u5ea6  &#8230; <a title=\"DeepSeek-V3\uff1a671B\u53c2\u6570\uff0c\u8bad\u7ec3\u6210\u672c557\u4e07\u7f8e\u5143\uff0c\u51ed\u4ec0\u4e48\uff1f\" class=\"read-more\" href=\"https:\/\/blog.nickys.cn\/?p=108\" aria-label=\"\u9605\u8bfb DeepSeek-V3\uff1a671B\u53c2\u6570\uff0c\u8bad\u7ec3\u6210\u672c557\u4e07\u7f8e\u5143\uff0c\u51ed\u4ec0\u4e48\uff1f\">\u9605\u8bfb\u66f4\u591a<\/a><\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[2],"tags":[],"class_list":["post-108","post","type-post","status-publish","format-standard","hentry","category-tech"],"_links":{"self":[{"href":"https:\/\/blog.nickys.cn\/index.php?rest_route=\/wp\/v2\/posts\/108","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/blog.nickys.cn\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/blog.nickys.cn\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/blog.nickys.cn\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/blog.nickys.cn\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=108"}],"version-history":[{"count":2,"href":"https:\/\/blog.nickys.cn\/index.php?rest_route=\/wp\/v2\/posts\/108\/revisions"}],"predecessor-version":[{"id":144,"href":"https:\/\/blog.nickys.cn\/index.php?rest_route=\/wp\/v2\/posts\/108\/revisions\/144"}],"wp:attachment":[{"href":"https:\/\/blog.nickys.cn\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=108"}],"
wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/blog.nickys.cn\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=108"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/blog.nickys.cn\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=108"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}