{"id":23228,"date":"2024-12-18T15:06:56","date_gmt":"2024-12-18T07:06:56","guid":{"rendered":"http:\/\/139.9.1.231\/?p=23228"},"modified":"2024-12-18T15:06:58","modified_gmt":"2024-12-18T07:06:58","slug":"qwen2-5-report","status":"publish","type":"post","link":"http:\/\/139.9.1.231\/index.php\/2024\/12\/18\/qwen2-5-report\/","title":{"rendered":"Qwen2.5 -\u6280\u672f\u62a5\u544a"},"content":{"rendered":"\n<div class=\"wp-block-image\"><figure class=\"aligncenter is-resized\"><img loading=\"lazy\" src=\"https:\/\/qianwen-res.oss-accelerate-overseas.aliyuncs.com\/assets\/logo\/qwen2.5_logo.png\" alt=\"Qwen2.5\" width=\"358\" height=\"126\"\/><\/figure><\/div>\n\n\n\n<p class=\"has-text-align-center\">\ud83e\udd17\u00a0<a href=\"https:\/\/huggingface.co\/Qwen\">Hugging Face<\/a>\u00a0\u00a0 | \u00a0\u00a0\ud83e\udd16\u00a0<a href=\"https:\/\/modelscope.cn\/organization\/qwen\">ModelScope<\/a>\u00a0\u00a0 | \u00a0\u00a0 \ud83d\udcd1 Paper (\u62a5\u544a\u8fd8\u672a\u53d1\u5e03) \u00a0\u00a0 | \u00a0\u00a0 \ud83d\udcd1\u00a0<a href=\"https:\/\/qwenlm.github.io\/blog\/qwen2.5\/\">Blog<\/a>\u00a0\u00a0\u00a0                      \ud83d\udcd6\u00a0<a href=\"https:\/\/qwen.readthedocs.io\/\">Documentation<\/a>\u00a0\u00a0 |\ud83d\udda5\ufe0f\u00a0<a href=\"https:\/\/huggingface.co\/spaces\/Qwen\/Qwen2.5-72B-Instruct\">Demo<\/a>\u00a0\u00a0 |     <a href=\"https:\/\/qwenlm.github.io\/\">\u535a\u5ba2<\/a>    |    <a 
href=\"https:\/\/github.com\/QwenLM\">GitHub<\/a><\/p>\n\n\n\n<p>Qwen\u662f\u963f\u91cc\u5df4\u5df4\u96c6\u56e2Qwen\u56e2\u961f\u7814\u53d1\u7684\u5927\u8bed\u8a00\u6a21\u578b\u548c\u5927\u578b\u591a\u6a21\u6001\u6a21\u578b\u7cfb\u5217\u3002\u76ee\u524d\uff0c\u5927\u8bed\u8a00\u6a21\u578b\u5df2\u5347\u7ea7\u81f3Qwen2.5\u7248\u672c\u3002\u65e0\u8bba\u662f\u8bed\u8a00\u6a21\u578b\u8fd8\u662f\u591a\u6a21\u6001\u6a21\u578b\uff0c\u5747\u5728\u5927\u89c4\u6a21\u591a\u8bed\u8a00\u548c\u591a\u6a21\u6001\u6570\u636e\u4e0a\u8fdb\u884c\u9884\u8bad\u7ec3\uff0c\u5e76\u901a\u8fc7\u9ad8\u8d28\u91cf\u6570\u636e\u8fdb\u884c\u540e\u671f\u5fae\u8c03\u4ee5\u8d34\u8fd1\u4eba\u7c7b\u504f\u597d\u3002Qwen\u5177\u5907\u81ea\u7136\u8bed\u8a00\u7406\u89e3\u3001\u6587\u672c\u751f\u6210\u3001\u89c6\u89c9\u7406\u89e3\u3001\u97f3\u9891\u7406\u89e3\u3001\u5de5\u5177\u4f7f\u7528\u3001\u89d2\u8272\u626e\u6f14\u3001\u4f5c\u4e3aAI Agent\u8fdb\u884c\u4e92\u52a8\u7b49\u591a\u79cd\u80fd\u529b\u3002<\/p>\n\n\n\n<p>\u6700\u65b0\u7248\u672cQwen2.5\u6709\u4ee5\u4e0b\u7279\u70b9\uff1a<\/p>\n\n\n\n<ul><li>\u6613\u4e8e\u4f7f\u7528\u7684\u4ec5\u89e3\u7801\u5668\u7a20\u5bc6\u8bed\u8a00\u6a21\u578b\uff0c\u63d0\u4f9b\u00a0<strong>0.5B<\/strong>\u00a0\u3001<strong>1.5B<\/strong>\u00a0\u3001<strong>3B<\/strong>\u00a0\u3001<strong>7B<\/strong>\u00a0\u3001<strong>14B<\/strong>\u00a0\u3001<strong>32B<\/strong>\u00a0\u548c\u00a0<strong>72B<\/strong>\u00a0\u51717\u79cd\u53c2\u6570\u89c4\u6a21\u7684\u6a21\u578b\uff0c\u5e76\u4e14\u6709\u57fa\u6a21\u578b\u548c\u6307\u4ee4\u5fae\u8c03\u6a21\u578b\u4e24\u79cd\u53d8\u4f53\uff08\u5176\u4e2d\u201c B \u201d\u8868\u793a\u201c\u5341\u4ebf\u201d\uff0c 72B \u5373\u4e3a 720 \u4ebf\uff09<\/li><li>\u5229\u7528\u6211\u4eec\u6700\u65b0\u7684\u6570\u636e\u96c6\u8fdb\u884c\u9884\u8bad\u7ec3\uff0c\u5305\u542b\u591a\u8fbe 18T tokens \uff08\u5176\u4e2d\u201c T \u201d\u8868\u793a\u201c\u4e07\u4ebf\u201d\uff0c 18T \u5373\u4e3a 18 
\u4e07\u4ebf\uff09<\/li><li>\u5728\u9075\u5faa\u6307\u4ee4\u3001\u751f\u6210\u957f\u6587\u672c\uff08\u8d85\u8fc7 8K tokens \uff09\u3001\u7406\u89e3\u7ed3\u6784\u5316\u6570\u636e\uff08\u4f8b\u5982\uff0c\u8868\u683c\uff09\u4ee5\u53ca\u751f\u6210\u7ed3\u6784\u5316\u8f93\u51fa\u7279\u522b\u662f JSON \u65b9\u9762\u6709\u4e86\u663e\u8457\u6539\u8fdb<\/li><li>\u66f4\u52a0\u9002\u5e94\u591a\u6837\u5316\u7684\u7cfb\u7edf\u63d0\u793a\uff0c\u589e\u5f3a\u4e86\u89d2\u8272\u626e\u6f14\u7684\u5b9e\u73b0\u548c\u804a\u5929\u673a\u5668\u4eba\u7684\u80cc\u666f\u8bbe\u7f6e\u3002<\/li><li>\u652f\u6301\u6700\u591a\u8fbe\u00a0<strong>128K<\/strong>\u00a0tokens \u7684\u4e0a\u4e0b\u6587\u957f\u5ea6\uff0c\u5e76\u80fd\u751f\u6210\u591a\u8fbe\u00a0<strong>8K<\/strong>\u00a0tokens \u7684\u6587\u672c\u3002<\/li><li>\u652f\u6301\u8d85\u8fc7\u00a0<strong>29<\/strong>\u00a0\u79cd\u8bed\u8a00\uff0c\u5305\u62ec\u4e2d\u6587\u3001\u82f1\u6587\u3001\u6cd5\u6587\u3001\u897f\u73ed\u7259\u6587\u3001\u8461\u8404\u7259\u6587\u3001\u5fb7\u6587\u3001\u610f\u5927\u5229\u6587\u3001\u4fc4\u6587\u3001\u65e5\u6587\u3001\u97e9\u6587\u3001\u8d8a\u5357\u6587\u3001\u6cf0\u6587\u3001\u963f\u62c9\u4f2f\u6587\u7b49\u3002<\/li><\/ul>\n\n\n\n<div class=\"wp-block-image\"><figure class=\"aligncenter is-resized\"><img loading=\"lazy\" src=\"https:\/\/tuso-360.feishu.cn\/space\/api\/box\/stream\/download\/asynccode\/?code=ODRiODlmZDY4ZTkzMjFlNmVjZWIwNzBkMjZlNWFlYzRfUm5iTktyZ2NYamdnMlVuWXdKb2sySlpaR3l0Ujd5V2lfVG9rZW46V1hSWGJWWlFSb1E1OE54b0VnamNiSWdGbk5kXzE3MzQ1MDYxMDM6MTczNDUwOTcwM19WNA\" alt=\"\" width=\"578\" 
height=\"281\"\/><\/figure><\/div>\n\n\n\n<h2>\u7b80\u4ecb<\/h2>\n\n\n\n<ol><li><strong>\u5168\u9762\u5f00\u6e90<\/strong>\uff1a\u8003\u8651\u5230\u7528\u6237\u5bf910B\u81f330B\u8303\u56f4\u6a21\u578b\u7684\u9700\u6c42\u548c\u79fb\u52a8\u7aef\u5bf93B\u6a21\u578b\u7684\u5174\u8da3\uff0c\u6b64\u6b21\u9664\u4e86\u7ee7\u7eed\u5f00\u6e90Qwen2\u7cfb\u5217\u4e2d\u76840.5B\/1.5B\/7B\/72B\u56db\u6b3e\u6a21\u578b\u5916\uff0cQwen2.5\u7cfb\u5217\u8fd8\u589e\u52a0\u4e86\u4e24\u4e2a\u9ad8\u6027\u4ef7\u6bd4\u7684\u4e2d\u7b49\u89c4\u6a21\u6a21\u578b\u2014\u2014\u00a0<strong>Qwen2.5-14B<\/strong>\u00a0\u548c\u00a0<strong>Qwen2.5-32B<\/strong>\uff0c\u4ee5\u53ca\u4e00\u6b3e\u9002\u5408\u79fb\u52a8\u7aef\u7684\u00a0<strong>Qwen2.5-3B<\/strong>\u3002\u6240\u6709\u6a21\u578b\u5728\u540c\u7c7b\u5f00\u6e90\u4ea7\u54c1\u4e2d\u5747\u5177\u6709\u5f88\u5f3a\u7684\u7ade\u4e89\u529b\uff0c\u4f8b\u5982Qwen2.5-32B\u7684\u6574\u4f53\u8868\u73b0\u8d85\u8d8a\u4e86Qwen2-72B\uff0cQwen2.5-14B\u5219\u9886\u5148\u4e8eQwen2-57B-A14B\u3002<\/li><li><strong>\u66f4\u5927\u89c4\u6a21\u3001\u66f4\u9ad8\u8d28\u91cf\u7684\u9884\u8bad\u7ec3\u6570\u636e\u96c6<\/strong>\uff1a\u6211\u4eec\u7684\u9884\u8bad\u7ec3\u6570\u636e\u96c6\u89c4\u6a21\u4ece 7T tokens \u6269\u5c55\u5230\u4e86\u00a0<strong>18T<\/strong>\u00a0tokens\u3002<\/li><li><strong>\u77e5\u8bc6\u50a8\u5907\u5347\u7ea7<\/strong>\uff1aQwen2.5\u7684\u77e5\u8bc6\u6db5\u76d6\u66f4\u5e7f\u3002\u5728MMLU\u57fa\u51c6\u4e2d\uff0cQwen2.5-7B \u548c 72B\u7684\u5f97\u5206\u76f8\u8f83\u4e8eQwen2\u5206\u522b\u4ece70.3\u63d0\u5347\u5230\u00a0<strong>74.2<\/strong>\uff0c\u548c\u4ece84.2\u63d0\u5347\u5230\u00a0<strong>86.1<\/strong>\u3002\u6b64\u5916\uff0cQwen2.5\u8fd8\u5728 GPQA\u3001MMLU-Pro\u3001MMLU-redux \u548c ARC-c 
\u7b49\u591a\u4e2a\u57fa\u51c6\u6d4b\u8bd5\u4e2d\u6709\u4e86\u660e\u663e\u63d0\u5347\u3002<\/li><li><strong>\u4ee3\u7801\u80fd\u529b\u589e\u5f3a<\/strong>\uff1a\u5f97\u76ca\u4e8eQwen2.5-Coder\u7684\u7a81\u7834\uff0cQwen2.5\u5728\u4ee3\u7801\u751f\u6210\u80fd\u529b\u4e0a\u4e5f\u5927\u5e45\u63d0\u5347\u3002Qwen2.5-72B-Instruct\u5728LiveCodeBench\uff082305-2409\uff09\u3001MultiPL-E\u548cMBPP\u4e2d\u5206\u522b\u5f97\u5206\u00a0<strong>55.5<\/strong>\u3001<strong>75.1<\/strong>\u00a0\u548c\u00a0<strong>88.2<\/strong>\uff0c\u4f18\u4e8eQwen2-72B-Instruct\u768432.2\u300169.2\u548c80.2\u3002<\/li><li><strong>\u6570\u5b66\u80fd\u529b\u63d0\u5347<\/strong>\uff1a\u5f15\u5165\u4e86Qwen2-math\u7684\u6280\u672f\u540e\uff0cQwen2.5\u7684\u6570\u5b66\u63a8\u7406\u8868\u73b0\u4e5f\u6709\u4e86\u5feb\u901f\u63d0\u5347\u3002\u5728MATH\u57fa\u51c6\u6d4b\u8bd5\u4e2d\uff0cQwen2.5-7B\/72B-Instruct\u5f97\u5206\u4eceQwen2-7B\/72B-Instruct\u768452.9\/69.0\u4e0a\u5347\u5230\u4e86\u00a0<strong>75.5\/83.1<\/strong>\u3002<\/li><li><strong>\u66f4\u7b26\u5408\u4eba\u7c7b\u504f\u597d<\/strong>\uff1aQwen2.5\u751f\u6210\u7684\u5185\u5bb9\u66f4\u52a0\u8d34\u8fd1\u4eba\u7c7b\u7684\u504f\u597d\u3002\u5177\u4f53\u6765\u770b\uff0cQwen2.5-72B-Instruct\u7684Arena-Hard\u5f97\u5206\u4ece\u00a0<strong>48.1<\/strong>\u00a0\u5927\u5e45\u63d0\u5347\u81f3\u00a0<strong>81.2<\/strong>\uff0cMT-Bench\u5f97\u5206\u4e5f\u4ece\u00a0<strong>9.12<\/strong>\u00a0\u63d0\u5347\u5230\u4e86\u00a0<strong>9.35<\/strong>\uff0c\u4e0e\u4e4b\u524d\u7684Qwen2-72B\u76f8\u6bd4\u63d0\u5347\u663e\u8457\u3002<\/li><li><strong>\u5176\u4ed6\u6838\u5fc3\u80fd\u529b\u63d0\u5347<\/strong>\uff1aQwen2.5\u5728\u00a0<strong>\u6307\u4ee4\u8ddf\u968f<\/strong>\u3001\u751f\u6210\u00a0<strong>\u957f\u6587\u672c<\/strong>\uff08\u4ece1K\u5347\u7ea7\u5230\u00a0<strong>8K 
tokens<\/strong>\uff09\u3001\u7406\u89e3\u00a0<strong>\u7ed3\u6784\u5316\u6570\u636e<\/strong>\uff08\u5982\u8868\u683c\uff09\uff0c\u4ee5\u53ca\u751f\u6210\u00a0<strong>\u7ed3\u6784\u5316\u8f93\u51fa<\/strong>\uff08\u5c24\u5176\u662fJSON\uff09\u4e0a\u90fd\u6709\u975e\u5e38\u660e\u663e\u7684\u8fdb\u6b65\u3002\u6b64\u5916\uff0cQwen2.5\u80fd\u591f\u66f4\u597d\u54cd\u5e94\u591a\u6837\u5316\u7684\u00a0<strong>\u7cfb\u7edf\u63d0\u793a<\/strong>\uff0c\u7528\u6237\u53ef\u4ee5\u7ed9\u6a21\u578b\u8bbe\u7f6e\u00a0<strong>\u7279\u5b9a\u89d2\u8272<\/strong>\u00a0\u6216\u00a0<strong>\u81ea\u5b9a\u4e49\u6761\u4ef6<\/strong>\u3002<\/li><\/ol>\n\n\n\n<h1 id=\"\u6a21\u578b\u57fa\u7840\u4fe1\u606f\">\u6a21\u578b\u57fa\u7840\u4fe1\u606f<\/h1>\n\n\n\n<p>\u672c\u6b21\u53d1\u5e03\u7684 Qwen2.5 \u8bed\u8a00\u6a21\u578b\u7cfb\u5217\u5305\u62ec\u4e03\u4e2a\u5f00\u6e90\u6a21\u578b\uff0c\u89c4\u6a21\u4ece 0.5B \u5230 72B \u4e0d\u7b49\u3002\u5927\u591a\u6570\u6a21\u578b\u652f\u6301 128K\uff08131,072\uff09\u4e2a token \u7684\u4e0a\u4e0b\u6587\u957f\u5ea6\uff0c\u5e76\u80fd\u751f\u6210 8K token \u7684\u6587\u672c\uff0c\u652f\u6301\u957f\u7bc7\u5185\u5bb9\u521b\u4f5c\u3002\u9664\u90e8\u5206\u7279\u6b8a\u7248\u672c\u5916\uff0c\u6a21\u578b\u4e3b\u8981\u91c7\u7528 Apache 2.0 \u5f00\u6e90\u8bb8\u53ef\u534f\u8bae\uff0c\u800c Qwen2.5-3B \u548c Qwen2.5-72B \u5206\u522b\u4f7f\u7528 Qwen Research \u8bb8\u53ef\u534f\u8bae \u548c Qwen \u8bb8\u53ef\u534f\u8bae\u3002<\/p>\n\n\n\n<figure class=\"wp-block-image size-large\"><img loading=\"lazy\" width=\"1024\" height=\"604\" src=\"http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-64-1024x604.png\" alt=\"\" class=\"wp-image-23239\" srcset=\"http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-64-1024x604.png 1024w, http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-64-300x177.png 300w, http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-64-768x453.png 768w, http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-64.png 1200w\" 
sizes=\"(max-width: 1024px) 100vw, 1024px\" \/><\/figure>\n\n\n\n<h2 id=\"\u6a21\u578b\u6027\u80fd\">\u6a21\u578b\u6027\u80fd<\/h2>\n\n\n\n<h3 id=\"qwen25\">Qwen2.5<\/h3>\n\n\n\n<p>\u4e3a\u4e86\u5c55\u793a Qwen2.5 \u7684\u80fd\u529b\uff0c\u6211\u4eec\u7528\u6211\u4eec\u6700\u5927\u7684\u5f00\u6e90\u6a21\u578b\u00a0<strong>Qwen2.5-72B<\/strong>\u00a0\u2014\u2014 \u4e00\u4e2a\u62e5\u6709 720 \u4ebf\u53c2\u6570\u7684\u7a20\u5bc6 decoder-only \u8bed\u8a00\u6a21\u578b\u2014\u2014\u4e0e\u9886\u5148\u7684\u5f00\u6e90\u6a21\u578b\u5982 Llama-3.1-70B \u548c Mistral-Large-V2\u8fdb\u884c\u4e86\u57fa\u51c6\u6d4b\u8bd5\u3002<strong>\u6211\u4eec\u5728\u591a\u4e2a\u57fa\u51c6\u6d4b\u8bd5\u4e2d\u5c55\u793a\u4e86\u7ecf\u8fc7\u6307\u4ee4\u8c03\u4f18\u7684\u7248\u672c\u7684\u7efc\u5408\u7ed3\u679c\uff0c\u8bc4\u4f30\u4e86\u6a21\u578b\u7684\u80fd\u529b\u548c\u4eba\u7c7b\u504f\u597d\u3002<\/strong><\/p>\n\n\n\n<figure class=\"wp-block-image size-large\"><img loading=\"lazy\" width=\"1024\" height=\"564\" src=\"http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-65-1024x564.png\" alt=\"\" class=\"wp-image-23242\" srcset=\"http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-65-1024x564.png 1024w, http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-65-300x165.png 300w, http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-65-768x423.png 768w, http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-65.png 1156w\" sizes=\"(max-width: 1024px) 100vw, 1024px\" \/><\/figure>\n\n\n\n<p>\u9664\u4e86\u6307\u4ee4\u5fae\u8c03\u7684\u6a21\u578b\u4e4b\u5916\uff0c\u6211\u4eec\u8fd8\u53d1\u73b0\uff0c\u6211\u4eec\u7684\u65d7\u8230\u5f00\u6e90\u6a21\u578b\u00a0<strong>Qwen2.5-72B<\/strong>\u00a0\u7684\u57fa\u7840\u8bed\u8a00\u6a21\u578b\u6027\u80fd\u8fbe\u5230\u4e86\u9876\u7ea7\u6c34\u51c6\uff0c\u5373\u4fbf\u662f\u5728\u4e0e Llama-3-405B \u8fd9\u6837\u66f4\u5927\u7684\u6a21\u578b\u5bf9\u6bd4\u65f6\u4e5f\u662f\u5982\u6b64\u3002<\/p>\n\n\n\n<figure class=\"wp-block-image 
size-large\"><img loading=\"lazy\" width=\"1024\" height=\"604\" src=\"http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-66-1024x604.png\" alt=\"\" class=\"wp-image-23245\" srcset=\"http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-66-1024x604.png 1024w, http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-66-300x177.png 300w, http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-66-768x453.png 768w, http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-66.png 1111w\" sizes=\"(max-width: 1024px) 100vw, 1024px\" \/><\/figure>\n\n\n\n<p>Qwen2.5 \u7684\u4e00\u4e2a\u91cd\u8981\u66f4\u65b0\u662f\u91cd\u65b0\u5f15\u5165\u4e86\u6211\u4eec\u7684 140 \u4ebf\u53c2\u6570\u548c 320 \u4ebf\u53c2\u6570\u6a21\u578b\uff0c\u5373\u00a0<strong>Qwen2.5-14B<\/strong>\u00a0\u548c\u00a0<strong>Qwen2.5-32B<\/strong>\u3002\u8fd9\u4e9b\u6a21\u578b\u5728\u591a\u6837\u5316\u7684\u4efb\u52a1\u4e2d\u8d85\u8d8a\u4e86\u540c\u7b49\u89c4\u6a21\u6216\u66f4\u5927\u89c4\u6a21\u7684\u57fa\u7ebf\u6a21\u578b\uff0c\u4f8b\u5982 Phi-3.5-MoE-Instruct \u548c Gemma2-27B-IT\u3002 \u5b83\u4eec\u5728\u6a21\u578b\u5927\u5c0f\u548c\u80fd\u529b\u4e4b\u95f4\u8fbe\u5230\u4e86\u6700\u4f73\u5e73\u8861\uff0c\u63d0\u4f9b\u4e86\u5339\u914d\u751a\u81f3\u8d85\u8fc7\u4e00\u4e9b\u8f83\u5927\u6a21\u578b\u7684\u6027\u80fd\u3002\u6b64\u5916\uff0c\u6211\u4eec\u7684\u57fa\u4e8e API \u7684\u6a21\u578b\u00a0<strong>Qwen2.5-Turbo<\/strong>\u00a0\u76f8\u6bd4\u8fd9\u4e24\u4e2a\u5f00\u6e90\u6a21\u578b\u63d0\u4f9b\u4e86\u6781\u5177\u7ade\u4e89\u529b\u7684\u6027\u80fd\uff0c\u540c\u65f6\u63d0\u4f9b\u4e86\u6210\u672c\u6548\u76ca\u9ad8\u4e14\u5feb\u901f\u7684\u670d\u52a1\u3002<\/p>\n\n\n\n<figure class=\"wp-block-image size-large\"><img loading=\"lazy\" width=\"1024\" height=\"604\" src=\"http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-67-1024x604.png\" alt=\"\" class=\"wp-image-23247\" srcset=\"http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-67-1024x604.png 1024w, 
http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-67-300x177.png 300w, http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-67-768x453.png 768w, http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-67.png 1053w\" sizes=\"(max-width: 1024px) 100vw, 1024px\" \/><\/figure>\n\n\n\n<p>\u8fd1\u6765\u4e5f\u51fa\u73b0\u4e86\u660e\u663e\u7684\u8f6c\u5411\u5c0f\u578b\u8bed\u8a00\u6a21\u578b\uff08SLMs\uff09\u7684\u8d8b\u52bf\u3002\u5c3d\u7ba1\u5386\u53f2\u4e0a\u5c0f\u578b\u8bed\u8a00\u6a21\u578b\uff08SLMs\uff09\u7684\u8868\u73b0\u4e00\u76f4\u843d\u540e\u4e8e\u5927\u578b\u8bed\u8a00\u6a21\u578b\uff08LLMs\uff09\uff0c\u4f46<strong>\u4e8c\u8005\u4e4b\u95f4\u7684\u6027\u80fd\u5dee\u8ddd\u6b63\u5728\u8fc5\u901f\u7f29\u5c0f\u3002\u503c\u5f97\u6ce8\u610f\u7684\u662f\uff0c\u5373\u4f7f\u662f\u53ea\u6709\u5927\u7ea6 30 \u4ebf\u53c2\u6570\u7684\u6a21\u578b\u73b0\u5728\u4e5f\u80fd\u53d6\u5f97\u9ad8\u5ea6\u7ade\u4e89\u529b\u7684\u7ed3\u679c<\/strong>\u3002\u9644\u5e26\u7684\u56fe\u8868\u663e\u793a\u4e86\u4e00\u4e2a\u91cd\u8981\u7684\u8d8b\u52bf\uff1a\u5728 MMLU \u4e2d\u5f97\u5206\u8d85\u8fc7 65 \u7684\u65b0\u578b\u6a21\u578b\u6b63\u53d8\u5f97\u8d8a\u6765\u8d8a\u5c0f\uff0c\u8fd9\u51f8\u663e\u4e86\u8bed\u8a00\u6a21\u578b\u7684\u77e5\u8bc6\u5bc6\u5ea6\u589e\u957f\u901f\u5ea6\u52a0\u5feb\u3002\u7279\u522b\u503c\u5f97\u4e00\u63d0\u7684\u662f\uff0c\u6211\u4eec\u7684\u00a0<strong>Qwen2.5-3B<\/strong>\u00a0\u6210\u4e3a\u8fd9\u4e00\u8d8b\u52bf\u7684\u4e00\u4e2a\u5178\u578b\u4f8b\u5b50\uff0c<strong>\u5b83\u4ec5\u51ed\u7ea6 30 \u4ebf\u53c2\u6570\u5c31\u5b9e\u73b0\u4e86\u4ee4\u4eba\u5370\u8c61\u6df1\u523b\u7684\u6027\u80fd\uff0c\u5c55\u793a\u4e86\u5176\u76f8\u5bf9\u4e8e\u524d\u8f88\u6a21\u578b\u7684\u9ad8\u6548\u6027\u548c\u80fd\u529b\u3002<\/strong><\/p>\n\n\n\n<figure class=\"wp-block-image size-large is-resized\"><img loading=\"lazy\" src=\"http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-68-1024x617.png\" alt=\"\" class=\"wp-image-23249\" width=\"626\" height=\"376\" 
srcset=\"http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-68-1024x617.png 1024w, http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-68-300x181.png 300w, http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-68-768x462.png 768w, http:\/\/139.9.1.231\/wp-content\/uploads\/2024\/12\/image-68.png 1068w\" sizes=\"(max-width: 626px) 100vw, 626px\" \/><\/figure>\n\n\n\n<p>\u9664\u4e86\u5728\u57fa\u51c6\u8bc4\u4f30\u4e2d\u53d6\u5f97\u7684\u663e\u8457\u589e\u5f3a\u5916\uff0c\u6211\u4eec\u8fd8\u6539\u8fdb\u4e86\u6211\u4eec\u7684\u540e\u8bad\u7ec3\u65b9\u6cd5\u3002\u6211\u4eec\u7684\u56db\u4e2a\u4e3b\u8981\u66f4\u65b0\u5305\u62ec\u652f\u6301\u6700\u957f\u53ef\u8fbe 8K \u6807\u8bb0\u7684\u957f\u6587\u672c\u751f\u6210\uff0c\u5927\u5e45\u63d0\u5347\u4e86\u5bf9\u7ed3\u6784\u5316\u6570\u636e\u7684\u7406\u89e3\u80fd\u529b\uff0c\u751f\u6210\u7ed3\u6784\u5316\u8f93\u51fa\uff08\u5c24\u5176\u662f JSON \u683c\u5f0f\uff09\u66f4\u52a0\u53ef\u9760\uff0c\u5e76\u4e14\u5728\u591a\u6837\u5316\u7684\u7cfb\u7edf\u63d0\u793a\u4e0b\u7684\u8868\u73b0\u5f97\u5230\u4e86\u52a0\u5f3a\uff0c\u8fd9\u6709\u52a9\u4e8e\u6709\u6548\u8fdb\u884c\u89d2\u8272\u626e\u6f14\u3002<\/p>\n","protected":false},"excerpt":{"rendered":"<p>\ud83e\udd17\u00a0Hugging Face\u00a0\u00a0 | \u00a0\u00a0\ud83e\udd16\u00a0ModelScope\u00a0\u00a0 | \u00a0\u00a0 \ud83d\udcd1 Paper (\u62a5\u544a\u8fd8\u672a\u53d1 &hellip; <a href=\"http:\/\/139.9.1.231\/index.php\/2024\/12\/18\/qwen2-5-report\/\" class=\"more-link\">\u7ee7\u7eed\u9605\u8bfb<span class=\"screen-reader-text\">Qwen2.5 
-\u6280\u672f\u62a5\u544a<\/span><\/a><\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":[],"categories":[21,4,9,38],"tags":[],"_links":{"self":[{"href":"http:\/\/139.9.1.231\/index.php\/wp-json\/wp\/v2\/posts\/23228"}],"collection":[{"href":"http:\/\/139.9.1.231\/index.php\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"http:\/\/139.9.1.231\/index.php\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"http:\/\/139.9.1.231\/index.php\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"http:\/\/139.9.1.231\/index.php\/wp-json\/wp\/v2\/comments?post=23228"}],"version-history":[{"count":18,"href":"http:\/\/139.9.1.231\/index.php\/wp-json\/wp\/v2\/posts\/23228\/revisions"}],"predecessor-version":[{"id":23251,"href":"http:\/\/139.9.1.231\/index.php\/wp-json\/wp\/v2\/posts\/23228\/revisions\/23251"}],"wp:attachment":[{"href":"http:\/\/139.9.1.231\/index.php\/wp-json\/wp\/v2\/media?parent=23228"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"http:\/\/139.9.1.231\/index.php\/wp-json\/wp\/v2\/categories?post=23228"},{"taxonomy":"post_tag","embeddable":true,"href":"http:\/\/139.9.1.231\/index.php\/wp-json\/wp\/v2\/tags?post=23228"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}