{"id":245293,"date":"2025-10-15T11:02:22","date_gmt":"2025-10-15T03:02:22","guid":{"rendered":"https:\/\/www.hkubs.hku.hk\/media\/hku-business-school-releases-latest-report-on-ais-advanced-reasoning-capabilities\/"},"modified":"2025-10-15T11:04:05","modified_gmt":"2025-10-15T03:04:05","slug":"hku-business-school-releases-latest-report-on-ais-advanced-reasoning-capabilities","status":"publish","type":"hkubs-media","link":"https:\/\/www.hkubs.hku.hk\/sc\/media\/press-release\/hku-business-school-releases-latest-report-on-ais-advanced-reasoning-capabilities\/","title":{"rendered":"\u6e2f\u5927\u7ecf\u7ba1\u5b66\u9662\u6700\u65b0\u6d4b\u8bc4\uff1aAI\u9ad8\u9636\u63a8\u7406\u80fd\u529b\uff0c\u54ea\u5bb6\u6700\u5f3a\uff1f"},"content":{"rendered":"<p>\u6e2f\u5927\u7ecf\u7ba1\u5b66\u9662\u4eca\u65e5\u53d1\u8868<strong>\u300aAI\u9ad8\u9636\u63a8\u7406\u80fd\u529b\u6d4b\u8bc4\u62a5\u544a\u300b<\/strong>\uff0c\u9488\u5bf9\u9009\u5b9a\u7684AI\u5927\u8bed\u8a00\u6a21\u578b\uff08LLM\uff09\u5728\u4e2d\u6587\u8bed\u5883\u4e0b\u7684\u9ad8\u9636\u63a8\u7406\u80fd\u529b\u8fdb\u884c\u6d4b\u8bc4\uff0c\u4ee5\u5168\u9762\u68c0\u89c6AI\u9ad8\u9636\u63a8\u7406\u80fd\u529b\u7684\u53d1\u5c55\u73b0\u72b6\u3002<\/p>\n<p>2025\u5e74\u4ee5\u6765\uff0cAI\u5927\u8bed\u8a00\u6a21\u578b\u4ece\u201c\u80fd\u5bf9\u8bdd\u201d\u5411\u201c\u4f1a\u601d\u8003\u201d\u5feb\u901f\u6f14\u8fdb\u3002 \u7136\u800c\u5728\u9700\u8981\u590d\u6742\u63a8\u7406\u80fd\u529b\u7684\u573a\u666f\u4e2d\uff0cAI\u7684\u63a8\u7406\u80fd\u529b\u53c2\u5dee\u4e0d\u9f50\uff0c\u5305\u62ec\u5bf9\u56fe\u7247\u548c\u6587\u5b57\u7b49\u8de8\u6a21\u6001\u4fe1\u606f\u7684\u6574\u5408\u5206\u6790\u80fd\u529b\uff0c\u6216\u9762\u5bf9\u975e\u5e38\u89c4\u6027\u590d\u6742\u9898\u76ee\u65f6\u7684\u521b\u65b0\u63a8\u7406\u80fd\u529b\u3002 
\u6709\u9274\u4e8e\u6b64\uff0c<strong>\u6e2f\u5927\u7ecf\u7ba1\u5b66\u9662\u521b\u65b0\u53ca\u4fe1\u606f\u7ba1\u7406\u5b66\u6559\u6388\u517c\u590f\u5229\u83b1\u4f09\u4fea\u57fa\u91d1\u6559\u6388\u848b\u9547\u8f89\u7387\u9886\u4eba\u5de5\u667a\u80fd\u8bc4\u4f30\u5b9e\u9a8c\u5ba4\uff08<\/strong><strong>AIEL<\/strong><strong>\uff09<\/strong>\uff08<span><a href=\"https:\/\/hkubs.hku.hk\/aimodelrankings\">https:\/\/hkubs.hku.hk\/aimodelrankings<\/a><\/span>\uff09\u7814\u7a76\u4eba\u5458\uff0c\u9996\u6b21\u6784\u5efa\u591a\u6a21\u6001\u63a8\u7406\u548c\u5965\u8d5b\u63a8\u7406\u7efc\u5408\u8bc4\u6d4b\u4f53\u7cfb\uff0c\u4ee5\u7cfb\u7edf\u6027\u3001\u5b9a\u91cf\u5316\u7684\u65b9\u5f0f\u9488\u5bf92025\u5e74\u4eba\u5de5\u667a\u80fd\u6280\u672f\u7684\u6838\u5fc3\u53d1\u5c55\u74f6\u9888\u2014\u2014\u9ad8\u9636\u63a8\u7406\u80fd\u529b\uff0c\u8fdb\u884c\u4e86\u5168\u9762\u6df1\u5165\u7684\u73b0\u72b6\u6d4b\u8bc4\u3002 \u6d4b\u8bc4\u5bf9\u8c61\u8986\u76d6\u4e2d\u7f8e\u4e24\u56fd\u622a\u6b622025\u5e7410\u6708\u4e2d\u65ec\u53d1\u5e03\u7684\u517137\u6b3e\u5927\u8bed\u8a00\u6a21\u578b\uff08\u542b14\u4e2a\u63a8\u7406\u6a21\u578b\u300120\u4e2a\u901a\u7528\u6a21\u578b\u548c3\u4e2a\u4e00\u4f53\u5316\u7cfb\u7edf\uff09\u3002<\/p>\n<p>\u6d4b\u8bc4\u7ed3\u679c\u663e\u793a\uff1a<\/p>\n<ul>\n<li>\u5728\u201c\u591a\u6a21\u6001\u63a8\u7406\u201d\u9886\u57df\uff0cGPT\u7cfb\u5217\u6301\u7eed\u9886\u5148\uff0c\u4ee5\u8c46\u53051.5 Pro\uff08\u601d\u8003\u6a21\u5f0f\uff09\u4e3a\u9996\u7684\u9876\u5c16\u56fd\u4ea7\u6a21\u578b\uff0c\u4e5f\u5df2\u6210\u529f\u8dfb\u8eab\u5168\u7403\u7b2c\u4e00\u68af\u961f\u3002<\/li>\n<li>\u5728\u66f4\u9ad8\u96be\u5ea6\u7684\u201c\u5965\u8d5b\u63a8\u7406\u201d\u9886\u57df\uff0c\u5219\u7531\u7f8e\u56fd\u6a21\u578b\u6574\u4f53\u4e3b\u5bfc\uff0c\u5176\u4e2dGPT-5\uff08\u601d\u8003\u6a21\u5f0f\uff09\u5448\u73b0\u65ad\u5c42\u4f18\u52bf\uff0c\u800cGemini 2.5 
Pro\u5219\u7d27\u968f\u5176\u540e\u3002<\/li>\n<li>\u6574\u4f53\u800c\u8a00\uff0c\u6b64\u6b21\u6d4b\u8bc4\u4f53\u73b0\u4e86\u4e00\u4e2a\u6e05\u6670\u7684\u884c\u4e1a\u8d8b\u52bf\uff1a\u5728\u9ad8\u9636\u63a8\u7406\u80fd\u529b\u9886\u57df\uff0c\u201c\u63a8\u7406\u6a21\u578b\u201d\u8868\u73b0\u4f18\u4e8e\u201c\u901a\u7528\u6a21\u578b\u201d\uff0c\u4e24\u8005\u68af\u5ea6\u5dee\u5f02\u660e\u663e\u3002 \u8fd9\u4e0e\u4eba\u5de5\u667a\u80fd\u4ea7\u4e1a\u7684\u53d1\u5c55\u89c4\u5f8b\u9ad8\u5ea6\u5951\u5408\u2014\u2014\u884c\u4e1a\u6b63\u7ecf\u5386\u4ece\u8ffd\u6c42\u201c\u5168\u573a\u666f\u901a\u7528\u80fd\u529b\u8986\u76d6\u201d\u8f6c\u5411\u805a\u7126\u201c\u4e13\u7528\u573a\u666f\u7a81\u7834\u4e0e\u6df1\u5ea6\u6548\u80fd\u4f18\u5316\u201d\uff0c\u6280\u672f\u53d1\u5c55\u4e5f\u5728\u4ece\u201c\u5e7f\u5ea6\u6269\u5f20\u201d\u8fc8\u5411\u201c\u6df1\u5ea6\u7cbe\u8015\u201d\u7684\u65b0\u9636\u6bb5\u3002<\/li>\n<\/ul>\n<p><strong>\u848b\u9547\u8f89\u6559\u6388<\/strong>\u8868\u793a\uff1a\u201c\u9ad8\u9636\u63a8\u7406\u80fd\u529b\u5bf9AI\u5728\u6559\u80b2\u3001\u79d1\u7814\u53ca\u5546\u4e1a\u51b3\u7b56\u7b49\u9886\u57df\u7684\u5e94\u7528\u62d3\u5c55\u81f3\u5173\u91cd\u8981\u3002 \u6b64\u7814\u7a76\u65e8\u5728\u63ed\u793a\u9ad8\u9636\u4eba\u5de5\u667a\u80fd\u6280\u672f\u7684\u53d1\u5c55\u73b0\u72b6\uff0c\u4ee4\u884c\u4e1a\u80fd\u591f\u7cbe\u51c6\u5b9a\u4f4d\u6280\u672f\u74f6\u9888\uff0c\u52a0\u901f\u901a\u7528\u4eba\u5de5\u667a\u80fd\u5728\u9ad8\u8981\u6c42\u9886\u57df\u7684\u843d\u5730\u5e94\u7528\uff0c\u6700\u7ec8\u63a8\u52a8AI\u4ece\u5bf9\u8bdd\u52a9\u624b\u8f6c\u578b\u6210\u4e3a\u66f4\u52a0\u9ad8\u7ea7\u7684\u667a\u80fd\u4f19\u4f34\u3002\u201d<\/p>\n<p><strong><u>\u6d4b\u8bc4\u65b9\u6cd5<\/u><\/strong><\/p>\n<p>\u8be5\u7814\u7a76\u7efc\u5408\u6d4b\u8bc4\u4e86\u5927\u8bed\u8a00\u6a21\u578b\u9ad8\u9636\u63a8\u7406\u80fd\u529b\u7684\u4e24\u4e2a\u6838\u5fc3 &#8211; 
\u591a\u6a21\u6001\u63a8\u7406\u80fd\u529b\u548c\u5965\u8d5b\u63a8\u7406\u80fd\u529b\u3002<\/p>\n<ul>\n<li><strong>\u591a\u6a21\u6001\u63a8\u7406\u80fd\u529b<\/strong>\u662f\u6307\u6a21\u578b\u5728\u6574\u5408\u6587\u672c\u3001\u56fe\u50cf\u3001\u6570\u636e\u56fe\u8868\u7b49\u591a\u79cd\u4fe1\u606f\u5f62\u5f0f\u8fdb\u884c\u8de8\u6a21\u6001\u5173\u8054\u5206\u6790\u4e0e\u903b\u8f91\u63a8\u5bfc\u65f6\u5c55\u793a\u7684\u80fd\u529b<strong>\u3002 <\/strong>\u5728\u6559\u80b2\u573a\u666f\u4e2d\uff0c\u5b83\u80fd\u5e2e\u52a9\u5b66\u751f\u7ed3\u5408\u6559\u6750\u6587\u672c\u4e0e\u56fe\u8868\u7406\u89e3\u79d1\u5b66\u539f\u7406\uff1b\u5728\u5546\u4e1a\u5206\u6790\u4e2d\uff0c\u53ef\u52a9\u529b\u4ece\u4e1a\u8005\u5339\u914d\u5e02\u573a\u6587\u5b57\u63cf\u8ff0\u4e0e\u9500\u552e\u56fe\u8868\uff0c\u9884\u5224\u6d88\u8d39\u8d8b\u52bf\u3002 \u8fd9\u79cd\u80fd\u529b\u662fAI\u5e94\u5bf9\u590d\u6742\u73b0\u5b9e\u4efb\u52a1\u7684\u201c\u5fc5\u5907\u7d20\u517b\u201d\u3002<\/li>\n<li><strong>\u5965\u8d5b\u63a8\u7406\u80fd\u529b<\/strong>\u5219\u901a\u8fc7\u56fd\u9645\u6570\u5b66\u5965\u6797\u5339\u514b\uff08IMO\uff09\u7b49\u6743\u5a01\u8d5b\u4e8b\u7684\u9ad8\u96be\u5ea6\u9898\u76ee\uff0c\u68c0\u9a8c\u6a21\u578b\u5728\u590d\u6742\u903b\u8f91\u7ed3\u6784\u3001\u591a\u6b65\u63a8\u5bfc\u4e0e\u521b\u9020\u6027\u601d\u7ef4\u4e0a\u7684\u8868\u73b0\u3002 \u8fd9\u7c7b\u9898\u76ee\u5f80\u5f80\u6ca1\u6709\u552f\u4e00\u89e3\u6cd5\uff0c\u66f4\u8003\u9a8cAI\u8df3\u51fa\u5e38\u89c4\u3001\u5bfb\u627e\u6700\u4f18\u89e3\u7684\u80fd\u529b\uff0c\u662f\u8861\u91cf\u5176\u201c\u6df1\u5ea6\u667a\u6167\u201d\u7684\u8bd5\u91d1\u77f3\u3002<\/li>\n<\/ul>\n<p><strong><u>\u591a\u6a21\u6001\u63a8\u7406\u80fd\u529b\u6392\u540d<\/u><\/strong><\/p>\n<p>\u6839\u636e\u6d4b\u8bc4\u7ed3\u679c\uff0c\u4e0d\u540c\u5927\u8bed\u8a00\u6a21\u578b\u5728\u591a\u6a21\u6001\u63a8\u7406\u80fd\u529b\u4e0a\u7684\u8868\u73b0\u6709\u660e\u663e\u5206\u5c42\u3002 
\u5176\u4e2d\uff0cGPT\u7cfb\u5217\u572885\u5206\u4ee5\u4e0a\u533a\u95f4\u7684\u4e94\u4e2a\u5934\u90e8\u6a21\u578b\u4e2d\u5360\u636e\u56db\u5e2d\uff0c\u5f62\u6210\u5b8c\u6574\u7684\u9876\u5c16\u80fd\u529b\u94fe\u6761\u3002 \u8c46\u53051.5 Pro\uff08\u601d\u8003\u6a21\u5f0f\uff09\u662f\u552f\u4e00\u8fdb\u5165\u524d\u4e94\u7684\u56fd\u4ea7\u6a21\u578b\uff0c\u5176\u901a\u7528\u4e0e\u601d\u8003\u6a21\u5f0f\u5dee\u8ddd\u6781\u5c0f\uff0c\u8bf4\u660e\u5176\u591a\u6a21\u6001\u63a8\u7406\u80fd\u529b\u5df2\u666e\u904d\u8fbe\u56fd\u9645\u9876\u5c16\u6c34\u5e73\u3002<\/p>\n<p>\u4ece\u6a21\u578b\u7c7b\u578b\u770b\uff0c\u548c\u901a\u7528\u6a21\u578b\u76f8\u6bd4\uff0c\u540c\u516c\u53f8\u7684\u63a8\u7406\u6a21\u578b\u5728\u590d\u6742\u4efb\u52a1\u4e2d\u5c55\u73b0\u51fa\u4e00\u5b9a\u7684\u4f18\u52bf\u3002<\/p>\n<table width=\"491\">\n<tbody>\n<tr>\n<td width=\"75\"><strong>\u6392\u540d<\/strong><\/td>\n<td width=\"236\"><strong>\u6a21\u578b\u540d\u79f0<\/strong><\/td>\n<td width=\"180\"><strong>\u591a\u6a21\u6001\u63a8\u7406\u80fd\u529b<\/strong><\/p>\n<p><strong>\u51c6\u786e\u7387\u5f97\u5206<\/strong><\/td>\n<\/tr>\n<tr>\n<td width=\"75\">1<\/td>\n<td width=\"236\">GPT-5\uff08\u601d\u8003\u6a21\u5f0f\uff09<\/td>\n<td width=\"180\">91<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">2<\/td>\n<td width=\"236\">GPT-4.1<\/td>\n<td width=\"180\">90<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">3<\/td>\n<td width=\"236\">GPT-o3<\/td>\n<td width=\"180\">87<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">4<\/td>\n<td width=\"236\">\u8c46\u5305<span>1.5 Pro<\/span><span>\uff08\u601d\u8003\u6a21\u5f0f\uff09<\/span><\/td>\n<td width=\"180\">85<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">4<\/td>\n<td width=\"236\">GPT<span>-5\uff08\u81ea\u52a8\u6a21\u5f0f\uff09<\/span><\/td>\n<td width=\"180\">85<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">6<\/td>\n<td width=\"236\">GPT-4o<\/td>\n<td width=\"180\">84<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">7<\/td>\n<td width=\"236\">Claude 4 
Opus<span>\uff08\u601d\u8003\u6a21\u5f0f\uff09<\/span><\/td>\n<td width=\"180\">83<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">8<\/td>\n<td width=\"236\">\u8c46\u5305<span>1.5 Pro<\/span><\/td>\n<td width=\"180\">82<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">8<\/td>\n<td width=\"236\">Grok 3<span>\uff08\u601d\u8003\u6a21\u5f0f\uff09<\/span><\/td>\n<td width=\"180\">82<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">10<\/td>\n<td width=\"236\">\u901a\u4e49\u5343\u95ee<span>3<\/span><\/td>\n<td width=\"180\">81<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">11<\/td>\n<td width=\"236\">Kimi-k1.5<\/td>\n<td width=\"180\">80<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">11<\/td>\n<td width=\"236\">\u65e5\u65e5\u65b0<span> V6<\/span><span>\u63a8\u7406<\/span><\/td>\n<td width=\"180\">80<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">11<\/td>\n<td width=\"236\">Step R1-V-Mini\uff08\u9636\u8dc3 R1-V-Mini\uff09<\/td>\n<td width=\"180\">80<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">14<\/td>\n<td width=\"236\">Grok<span> 4<\/span><\/td>\n<td width=\"180\">79<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">14<\/td>\n<td width=\"236\">GPT-o4 mini<\/td>\n<td width=\"180\">79<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">14<\/td>\n<td width=\"236\">\u6df7\u5143<span>-T1<\/span><\/td>\n<td width=\"180\">79<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">17<\/td>\n<td width=\"236\">GLM-4-plus\uff08\u667a\u8c31-4-Plus\uff09<\/td>\n<td width=\"180\">78<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">17<\/td>\n<td width=\"236\">\u901a\u4e49\u5343\u95ee<span>3<\/span><span>\uff08\u601d\u8003\u6a21\u5f0f\uff09<\/span><\/td>\n<td width=\"180\">78<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">19<\/td>\n<td width=\"236\">Gemini 2.5 Flash<\/td>\n<td width=\"180\">77<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">19<\/td>\n<td width=\"236\">GLM-Z1-Air\uff08\u667a\u8c31-Z1-Air\uff09<\/td>\n<td width=\"180\">77<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">21<\/td>\n<td width=\"236\">Llama 3.3 70B<\/td>\n<td width=\"180\">76<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">22<\/td>\n<td 
width=\"236\">\u65e5\u65e5\u65b0<span> V6 Pro<\/span><\/td>\n<td width=\"180\">75<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">22<\/td>\n<td width=\"236\">Gemini 2.5 Pro<\/td>\n<td width=\"180\">75<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">24<\/td>\n<td width=\"236\">\u6587\u5fc3\u4e00\u8a00<span>4.5-Turbo<\/span><\/td>\n<td width=\"180\">74<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">25<\/td>\n<td width=\"236\">Step 2\uff08\u9636\u8dc32\uff09<\/td>\n<td width=\"180\">73<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">26<\/td>\n<td width=\"236\">\u6df7\u5143<span>-TurboS<\/span><\/td>\n<td width=\"180\">71<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">26<\/td>\n<td width=\"236\">Claude 4 Opus<\/td>\n<td width=\"180\">71<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">28<\/td>\n<td width=\"236\">Spark 4.0 Ultra\uff08\u8baf\u98de\u661f\u706b 4.0 Ultra\uff09<\/td>\n<td width=\"180\">68<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">28<\/td>\n<td width=\"236\">MiniMax-01<\/td>\n<td width=\"180\">68<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">30<\/td>\n<td width=\"236\">Baichuan4-Turbo\uff08\u767e\u5ddd4-Turbo\uff09<\/td>\n<td width=\"180\">67<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">31<\/td>\n<td width=\"236\">Grok 3<\/td>\n<td width=\"180\">66<\/td>\n<\/tr>\n<tr>\n<td width=\"75\">32<\/td>\n<td width=\"236\">Kimi<\/td>\n<td width=\"180\">63<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>\u8868 1\uff1a\u591a\u6a21\u6001\u63a8\u7406\u80fd\u529b\u6392\u540d<\/p>\n<p><strong><u>\u5965\u8d5b\u63a8\u7406\u80fd\u529b\u6392\u540d<\/u><\/strong><\/p>\n<p>\u6839\u636e\u8bc4\u6d4b\u7ed3\u679c\uff0c\u7f8e\u56fd\u5927\u8bed\u8a00\u6a21\u578b\u5728\u6b63\u786e\u6027\u3001\u903b\u8f91\u8fde\u8d2f\u6027\u3001\u65b9\u6cd5\u521b\u65b0\u6027\u3001\u5965\u8d5b\u63a8\u7406\u80fd\u529b\u4e0a\u5448\u73b0\u201c\u591a\u7ef4\u5ea6\u9886\u5148\u201d\u7684\u7279\u70b9\u3002 GPT-5\uff08\u601d\u8003\u6a21\u5f0f\uff09\u548cGemini 2.5 Pro\u65ad\u5c42\u9886\u5148\uff0cGPT-o3\uff0cClaude 4 
Opus\uff08\u601d\u8003\u6a21\u5f0f\uff09\u5206\u5217\u7b2c\u4e09\u540d\u53ca\u7b2c\u56db\u540d; \u56fd\u4ea7\u6a21\u578b\u4e2d\uff0c\u901a\u4e49\u5343\u95ee3\uff08\u601d\u8003\u6a21\u5f0f\uff09\u548cStep R1_V_mini\u8868\u73b0\u9886\u5148\u3002\u603b\u4f53\u6765\u8bf4\uff0c\u56fd\u4ea7\u6a21\u578b\u5728\u590d\u6742\u63a8\u7406\u4e0a\u4ecd\u6709\u5f88\u5927\u8fdb\u6b65\u7a7a\u95f4\u3002<\/p>\n<p>\u6b64\u5916\uff0c\u5bf9\u6bd4\u540c\u516c\u53f8\u7684\u901a\u7528\u4e0e\u63a8\u7406\u6a21\u578b\u7248\u672c\uff0c\u6211\u4eec\u53d1\u73b0\u601d\u8003\u6a21\u5f0f\u4e0b\u7684\u6a21\u578b\u5728\u5965\u8d5b\u63a8\u7406\u80fd\u529b\u5404\u7ef4\u5ea6\u7684\u8868\u73b0\u666e\u904d\u66f4\u597d\u3002<\/p>\n<table width=\"568\">\n<tbody>\n<tr>\n<td width=\"48\"><strong>\u6392\u540d<\/strong><\/td>\n<td width=\"208\"><strong>\u6a21\u578b\u540d\u79f0<\/strong><\/td>\n<td width=\"68\"><strong>\u6b63\u786e\u6027<\/strong><\/td>\n<td width=\"80\"><strong>\u903b\u8f91\u8fde\u8d2f\u6027<\/strong><\/td>\n<td width=\"77\"><strong>\u65b9\u6cd5\u521b\u65b0\u6027<\/strong><\/td>\n<td width=\"87\"><strong>\u5965\u8d5b\u63a8\u7406\u80fd\u529b<\/strong><\/p>\n<p><strong>\u52a0\u6743\u5f97\u5206<\/strong><\/td>\n<\/tr>\n<tr>\n<td width=\"48\">1<\/td>\n<td width=\"208\">GPT-5\uff08\u601d\u8003\u6a21\u5f0f\uff09<\/td>\n<td width=\"68\">48<\/td>\n<td width=\"80\">47<\/td>\n<td width=\"77\">44<\/td>\n<td width=\"87\">48<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">2<\/td>\n<td width=\"208\">Gemini 2.5 Pro<\/td>\n<td width=\"68\">48<\/td>\n<td width=\"80\">39<\/td>\n<td width=\"77\">36<\/td>\n<td width=\"87\">44<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">3<\/td>\n<td width=\"208\">GPT-o3<\/td>\n<td width=\"68\">36<\/td>\n<td width=\"80\">42<\/td>\n<td width=\"77\">39<\/td>\n<td width=\"87\">38<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">4<\/td>\n<td width=\"208\">Claude 4 Opus\uff08\u601d\u8003\u6a21\u5f0f\uff09<\/td>\n<td width=\"68\">30<\/td>\n<td width=\"80\">36<\/td>\n<td width=\"77\">39<\/td>\n<td 
width=\"87\">33<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">5<\/td>\n<td width=\"208\">Gemini 2.5 Flash<\/td>\n<td width=\"68\">35<\/td>\n<td width=\"80\">28<\/td>\n<td width=\"77\">31<\/td>\n<td width=\"87\">32<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">5<\/td>\n<td width=\"208\">GPT-o4 mini<\/td>\n<td width=\"68\">32<\/td>\n<td width=\"80\">33<\/td>\n<td width=\"77\">33<\/td>\n<td width=\"87\">32<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">7<\/td>\n<td width=\"208\">\u901a\u4e49\u5343\u95ee3\uff08\u601d\u8003\u6a21\u5f0f\uff09<\/td>\n<td width=\"68\">29<\/td>\n<td width=\"80\">25<\/td>\n<td width=\"77\">28<\/td>\n<td width=\"87\">28<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">7<\/td>\n<td width=\"208\">Step R1_V_mini<\/td>\n<td width=\"68\">26<\/td>\n<td width=\"80\">33<\/td>\n<td width=\"77\">22<\/td>\n<td width=\"87\">28<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">9<\/td>\n<td width=\"208\">GLM_Z1_Air<\/td>\n<td width=\"68\">27<\/td>\n<td width=\"80\">31<\/td>\n<td width=\"77\">22<\/td>\n<td width=\"87\">27<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">9<\/td>\n<td width=\"208\">\u65e5\u65e5\u65b0 V6\u63a8\u7406<\/td>\n<td width=\"68\">27<\/td>\n<td width=\"80\">28<\/td>\n<td width=\"77\">22<\/td>\n<td width=\"87\">27<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">11<\/td>\n<td width=\"208\">\u901a\u4e49\u5343\u95ee3<\/td>\n<td width=\"68\">25<\/td>\n<td width=\"80\">31<\/td>\n<td width=\"77\">17<\/td>\n<td width=\"87\">26<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">12<\/td>\n<td width=\"208\">\u6587\u5fc3\u4e00\u8a004.5-Turbo<\/td>\n<td width=\"68\">25<\/td>\n<td width=\"80\">25<\/td>\n<td width=\"77\">19<\/td>\n<td width=\"87\">24<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">13<\/td>\n<td width=\"208\">Grok 3\uff08\u601d\u8003\u6a21\u5f0f\uff09<\/td>\n<td width=\"68\">21<\/td>\n<td width=\"80\">28<\/td>\n<td width=\"77\">25<\/td>\n<td width=\"87\">23<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">14<\/td>\n<td width=\"208\">GPT-5\uff08\u81ea\u52a8\u6a21\u5f0f\uff09<\/td>\n<td width=\"68\">22<\/td>\n<td 
width=\"80\">22<\/td>\n<td width=\"77\">28<\/td>\n<td width=\"87\">22<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">14<\/td>\n<td width=\"208\">DeepSeek-V3\uff08\u6df1\u5ea6\u6c42\u7d22-V3\uff09<\/td>\n<td width=\"68\">26<\/td>\n<td width=\"80\">14<\/td>\n<td width=\"77\">22<\/td>\n<td width=\"87\">22<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">16<\/td>\n<td width=\"208\">Claude 4 Opus<\/td>\n<td width=\"68\">22<\/td>\n<td width=\"80\">17<\/td>\n<td width=\"77\">31<\/td>\n<td width=\"87\">21<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">17<\/td>\n<td width=\"208\">\u8c46\u53051.5 Pro\uff08\u601d\u8003\u6a21\u5f0f\uff09<\/td>\n<td width=\"68\">22<\/td>\n<td width=\"80\">17<\/td>\n<td width=\"77\">22<\/td>\n<td width=\"87\">20<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">17<\/td>\n<td width=\"208\">DeepSeek-R1\uff08\u6df1\u5ea6\u6c42\u7d22-R1\uff09<\/td>\n<td width=\"68\">17<\/td>\n<td width=\"80\">25<\/td>\n<td width=\"77\">22<\/td>\n<td width=\"87\">20<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">19<\/td>\n<td width=\"208\">Grok 3<\/td>\n<td width=\"68\">20<\/td>\n<td width=\"80\">19<\/td>\n<td width=\"77\">17<\/td>\n<td width=\"87\">19<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">19<\/td>\n<td width=\"208\">Grok 4<\/td>\n<td width=\"68\">19<\/td>\n<td width=\"80\">17<\/td>\n<td width=\"77\">25<\/td>\n<td width=\"87\">19<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">21<\/td>\n<td width=\"208\">\u6587\u5fc3\u4e00\u8a00 X1-Turbo<\/td>\n<td width=\"68\">17<\/td>\n<td width=\"80\">19<\/td>\n<td width=\"77\">14<\/td>\n<td width=\"87\">17<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">21<\/td>\n<td width=\"208\">\u6df7\u5143-T1<\/td>\n<td width=\"68\">17<\/td>\n<td width=\"80\">17<\/td>\n<td width=\"77\">19<\/td>\n<td width=\"87\">17<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">21<\/td>\n<td width=\"208\">\u6df7\u5143-TurboS<\/td>\n<td width=\"68\">17<\/td>\n<td width=\"80\">17<\/td>\n<td width=\"77\">19<\/td>\n<td width=\"87\">17<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">21<\/td>\n<td width=\"208\">Kimi-k1.5<\/td>\n<td 
width=\"68\">17<\/td>\n<td width=\"80\">19<\/td>\n<td width=\"77\">11<\/td>\n<td width=\"87\">17<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">25<\/td>\n<td width=\"208\">\u8c46\u53051.5 Pro<\/td>\n<td width=\"68\">16<\/td>\n<td width=\"80\">17<\/td>\n<td width=\"77\">19<\/td>\n<td width=\"87\">16<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">26<\/td>\n<td width=\"208\">GLM-4-plus\uff08\u667a\u8c31-4-Plus\uff09<\/td>\n<td width=\"68\">12<\/td>\n<td width=\"80\">17<\/td>\n<td width=\"77\">8<\/td>\n<td width=\"87\">13<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">27<\/td>\n<td width=\"208\">GPT-4o<\/td>\n<td width=\"68\">13<\/td>\n<td width=\"80\">8<\/td>\n<td width=\"77\">19<\/td>\n<td width=\"87\">12<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">27<\/td>\n<td width=\"208\">Spark 4.0 Ultra\uff08\u8baf\u98de\u661f\u706b 4.0 Ultra\uff09<\/td>\n<td width=\"68\">13<\/td>\n<td width=\"80\">11<\/td>\n<td width=\"77\">14<\/td>\n<td width=\"87\">12<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">29<\/td>\n<td width=\"208\">Baichuan4-Turbo\uff08\u767e\u5ddd4-Turbo\uff09<\/td>\n<td width=\"68\">8<\/td>\n<td width=\"80\">19<\/td>\n<td width=\"77\">11<\/td>\n<td width=\"87\">11<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">29<\/td>\n<td width=\"208\">GPT-4.1<\/td>\n<td width=\"68\">11<\/td>\n<td width=\"80\">8<\/td>\n<td width=\"77\">17<\/td>\n<td width=\"87\">11<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">31<\/td>\n<td width=\"208\">Kimi<\/td>\n<td width=\"68\">6<\/td>\n<td width=\"80\">14<\/td>\n<td width=\"77\">17<\/td>\n<td width=\"87\">9<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">31<\/td>\n<td width=\"208\">Llama 3.3 70B<\/td>\n<td width=\"68\">7<\/td>\n<td width=\"80\">14<\/td>\n<td width=\"77\">6<\/td>\n<td width=\"87\">9<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">33<\/td>\n<td width=\"208\">Yi-Lightning\uff08\u96f6\u4e00-Lightning\uff09<\/td>\n<td width=\"68\">6<\/td>\n<td width=\"80\">11<\/td>\n<td width=\"77\">14<\/td>\n<td width=\"87\">8<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">33<\/td>\n<td width=\"208\">\u65e5\u65e5\u65b0 V6 
Pro<\/td>\n<td width=\"68\">8<\/td>\n<td width=\"80\">8<\/td>\n<td width=\"77\">6<\/td>\n<td width=\"87\">8<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">35<\/td>\n<td width=\"208\">MiniMax-01<\/td>\n<td width=\"68\">5<\/td>\n<td width=\"80\">11<\/td>\n<td width=\"77\">8<\/td>\n<td width=\"87\">7<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">35<\/td>\n<td width=\"208\">Step2<\/td>\n<td width=\"68\">6<\/td>\n<td width=\"80\">8<\/td>\n<td width=\"77\">8<\/td>\n<td width=\"87\">7<\/td>\n<\/tr>\n<tr>\n<td width=\"48\">35<\/td>\n<td width=\"208\">360\u667a\u81112-o1<\/td>\n<td width=\"68\">7<\/td>\n<td width=\"80\">6<\/td>\n<td width=\"77\">8<\/td>\n<td width=\"87\">7<\/td>\n<\/tr>\n<tr>\n<td colspan=\"6\" width=\"568\">Note: \u6240\u6709\u5206\u6570\u5747\u4e3a\u56db\u820d\u4e94\u5165\u5f97\u5206\u7ed3\u679c\u3002<\/td>\n<\/tr>\n<\/tbody>\n<\/table>\n<p>\u8868 2\uff1a\u5965\u8d5b\u63a8\u7406\u80fd\u529b\u6392\u540d<\/p>\n<p>\u8bf7<a href=\"https:\/\/www.hkubs.hku.hk\/aimodelrankings\/leaderboards\/advancedreasoningCapabilities.html\"><span>\u6309\u6b64<\/span><\/a>\u9605\u8bfb\u300aAI\u9ad8\u9636\u63a8\u7406\u80fd\u529b\u6d4b\u8bc4\u62a5\u544a\u300b\u5168\u6587<\/p>\n<p>\u7efc\u5408\u4ee5\u4e0a\u8bc4\u4f30\u53ef\u77e5\uff0c\u5728\u5730\u57df\u4e0a\uff0c\u7f8e\u56fd\u6a21\u578b\u5728\u591a\u6a21\u6001\u548c\u5965\u8d5b\u63a8\u7406\u4e2d\u8868\u73b0\u7a81\u51fa\uff0c\u6682\u65f6\u9886\u5148; \u4e2d\u56fd\u6a21\u578b\u4ecd\u9700\u5728\u6df1\u5c42\u8bed\u5883\u7406\u89e3\u3001\u590d\u6742\u63a8\u7406\u94fe\u6216\u521b\u9020\u6027\u89e3\u51b3\u95ee\u9898\u4e0a\u5f25\u8865\u5dee\u8ddd\u3002 
\u6b64\u5916\uff0c\u63a8\u7406\u6a21\u578b\u5728\u9ad8\u9636\u63a8\u7406\u80fd\u529b\u9886\u57df\u7684\u8868\u73b0\u666e\u904d\u4f18\u4e8e\u901a\u7528\u6a21\u578b\u3002<\/p>\n<p>\u5c55\u671b\u672a\u6765\uff0c\u4eba\u5de5\u667a\u80fd\u9700\u5728\u8de8\u6a21\u6001\u6df1\u5ea6\u878d\u5408\u548c\u6781\u7aef\u590d\u6742\u95ee\u9898\u7684\u521b\u9020\u6027\u89e3\u51b3\u4e0a\u6301\u7eed\u5b9e\u73b0\u6838\u5fc3\u7a81\u7834\u3002\u5bf9\u4e8e\u4e2d\u56fd\u6a21\u578b\u800c\u8a00\uff0c\u5176\u5173\u952e\u5728\u4e8e\u4f9d\u6258\u672c\u571f\u573a\u666f\u7684\u72ec\u7279\u4f18\u52bf\uff0c\u7cbe\u51c6\u8865\u9f50\u9ad8\u9636\u63a8\u7406\u80fd\u529b\u4e0a\u7684\u77ed\u677f\uff0c\u4ece\u800c\u63a8\u52a8AI\u4ece\u201c\u80fd\u7528\u201d\u5411\u201c\u771f\u667a\u6167\u201d\u8fc8\u8fdb\uff0c\u5e76\u5e94\u7528\u4e8e\u66f4\u5e7f\u6cdb\u3001\u66f4\u590d\u6742\u7684\u573a\u666f\u4e2d\u3002<\/p>\n<p><strong><u>\u56fe\u7247<\/u><\/strong><\/p>\n<p><img fetchpriority=\"high\" decoding=\"async\" class=\"alignnone wp-image-245274 size-full\" src=\"https:\/\/www.hkubs.hku.hk\/wp-content\/uploads\/2025\/10\/JackJiang01.jpg\" alt=\"\" width=\"868\" height=\"1258\" srcset=\"https:\/\/www.hkubs.hku.hk\/wp-content\/uploads\/2025\/10\/JackJiang01.jpg 868w, https:\/\/www.hkubs.hku.hk\/wp-content\/uploads\/2025\/10\/JackJiang01-207x300.jpg 207w, https:\/\/www.hkubs.hku.hk\/wp-content\/uploads\/2025\/10\/JackJiang01-707x1024.jpg 707w, https:\/\/www.hkubs.hku.hk\/wp-content\/uploads\/2025\/10\/JackJiang01-768x1113.jpg 768w\" sizes=\"(max-width: 868px) 100vw, 868px\" \/><\/p>\n<p>\u6e2f\u5927\u7ecf\u7ba1\u5b66\u9662\u521b\u65b0\u53ca\u4fe1\u606f\u7ba1\u7406\u5b66\u6559\u6388\u517c\u590f\u5229\u83b1\u4f09\u4fea\u57fa\u91d1\u6559\u6388<a href=\"https:\/\/www.hkubs.hku.hk\/sc\/people\/zhenhui-jack-jiang\/\"><strong>\u848b\u9547\u8f89\u6559\u6388<\/strong><\/a><\/p>\n<p>\u8bf7<a 
href=\"https:\/\/drive.google.com\/drive\/folders\/1AQs5bn8JVDpdqfM50EWmYbcZl5pwEQ5p?usp=sharing\">\u6309\u6b64<\/a>\u4e0b\u8f7d\u9ad8\u6e05\u56fe\u7247\u3002<\/p>\n","protected":false},"featured_media":0,"template":"","meta":{"_lmt_disableupdate":"no","_lmt_disable":"","footnotes":""},"class_list":["post-245293","hkubs-media","type-hkubs-media","status-publish","hentry","media-categories-press-release-sc","media-topic-categories-research-sc"],"aioseo_notices":[],"_links":{"self":[{"href":"https:\/\/www.hkubs.hku.hk\/sc\/wp-json\/wp\/v2\/hkubs-media\/245293","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.hkubs.hku.hk\/sc\/wp-json\/wp\/v2\/hkubs-media"}],"about":[{"href":"https:\/\/www.hkubs.hku.hk\/sc\/wp-json\/wp\/v2\/types\/hkubs-media"}],"version-history":[{"count":1,"href":"https:\/\/www.hkubs.hku.hk\/sc\/wp-json\/wp\/v2\/hkubs-media\/245293\/revisions"}],"predecessor-version":[{"id":245294,"href":"https:\/\/www.hkubs.hku.hk\/sc\/wp-json\/wp\/v2\/hkubs-media\/245293\/revisions\/245294"}],"wp:attachment":[{"href":"https:\/\/www.hkubs.hku.hk\/sc\/wp-json\/wp\/v2\/media?parent=245293"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}