{"id":34993,"date":"2024-12-16T14:58:56","date_gmt":"2024-12-16T06:58:56","guid":{"rendered":"https:\/\/17aitech.com\/?p=34993"},"modified":"2024-12-16T14:58:56","modified_gmt":"2024-12-16T06:58:56","slug":"llama3%e8%ae%ad%e7%bb%83%e6%af%8f3%e5%b0%8f%e6%97%b6%e5%b4%a9%e4%b8%80%e6%ac%a1%ef%bc%9f%e8%b1%86%e5%8c%85%e5%a4%a7%e6%a8%a1%e5%9e%8b%e3%80%81%e6%b8%af%e5%a4%a7%e5%9b%a2%e9%98%9f%e4%b8%ba%e8%84%86","status":"publish","type":"post","link":"https:\/\/17aitech.com\/?p=34993","title":{"rendered":"Llama3\u8bad\u7ec3\u6bcf3\u5c0f\u65f6\u5d29\u4e00\u6b21\uff1f\u8c46\u5305\u5927\u6a21\u578b\u3001\u6e2f\u5927\u56e2\u961f\u4e3a\u8106\u76ae\u4e07\u5361\u8bad\u7ec3\u63d0\u6548"},"content":{"rendered":"<p>\u6587\u7ae0\u6765\u6e90\u4e8e\u4e92\u8054\u7f51:<a href=\"https:\/\/www.jiqizhixin.com\/articles\/2024-08-08-7\" target=\"_blank\">Llama3\u8bad\u7ec3\u6bcf3\u5c0f\u65f6\u5d29\u4e00\u6b21\uff1f\u8c46\u5305\u5927\u6a21\u578b\u3001\u6e2f\u5927\u56e2\u961f\u4e3a\u8106\u76ae\u4e07\u5361\u8bad\u7ec3\u63d0\u6548<\/a><\/p>\n<blockquote data-author-name=\"\" data-content-utf8-length=\"115\" data-source-title=\"\" data-type=\"2\" data-url=\"\">\n<section>\n<section>\n<p>\u4f34\u968f\u5927\u6a21\u578b\u8fed\u4ee3\u901f\u5ea6\u8d8a\u6765\u8d8a\u5feb\uff0c\u8bad\u7ec3\u96c6\u7fa4\u89c4\u6a21\u8d8a\u6765\u8d8a\u5927\uff0c\u9ad8\u9891\u7387\u7684\u8f6f\u786c\u4ef6\u6545\u969c\u5df2\u7ecf\u6210\u4e3a\u963b\u788d\u8bad\u7ec3\u6548\u7387\u8fdb\u4e00\u6b65\u63d0\u9ad8\u7684\u75db\u70b9\uff0c\u68c0\u67e5\u70b9\uff08Checkpoint\uff09\u7cfb\u7edf\u5728\u8bad\u7ec3\u8fc7\u7a0b\u4e2d\u8d1f\u8d23\u72b6\u6001\u7684\u5b58\u50a8\u548c\u6062\u590d\uff0c\u5df2\u7ecf\u6210\u4e3a\u514b\u670d\u8bad\u7ec3\u6545\u969c\u3001\u4fdd\u969c\u8bad\u7ec3\u8fdb\u5ea6\u548c\u63d0\u9ad8\u8bad\u7ec3\u6548\u7387\u7684\u5173\u952e\u3002<\/p>\n<\/section>\n<\/section>\n<\/blockquote>\n<blockquote data-author-name=\"\" data-content-utf8-length=\"214\" data-source-title=\"\" data-type=\"2\" 
data-url=\"\">\n<section>\n<p>\u8fd1\u65e5\uff0c<mark data-type=\"institutions\" data-id=\"7092494f-e4a9-4175-8efe-b5ddb66a9878\">\u5b57\u8282\u8df3\u52a8<\/mark>\u8c46\u5305\u5927\u6a21\u578b\u56e2\u961f\u4e0e\u9999\u6e2f\u5927\u5b66\u8054\u5408\u63d0\u51fa\u4e86 ByteCheckpoint\u3002\u8fd9\u662f\u4e00\u4e2a PyTorch \u539f\u751f\uff0c\u517c\u5bb9\u591a\u4e2a\u8bad\u7ec3\u6846\u67b6\uff0c\u652f\u6301 Checkpoint \u7684\u9ad8\u6548\u8bfb\u5199\u548c\u81ea\u52a8\u91cd\u65b0\u5207\u5206\u7684\u5927\u6a21\u578b Checkpointing \u7cfb\u7edf\uff0c\u76f8\u6bd4\u73b0\u6709\u65b9\u6cd5\u6709\u663e\u8457\u6027\u80fd\u63d0\u5347\u548c\u6613\u7528\u6027\u4f18\u52bf\u3002\u672c\u6587\u4ecb\u7ecd\u4e86\u5927\u6a21\u578b\u8bad\u7ec3\u63d0\u6548\u4e2d Checkpoint \u65b9\u5411\u9762\u4e34\u7684\u6311\u6218\uff0c\u603b\u7ed3 ByteCheckpoint \u7684\u89e3\u51b3\u601d\u8def\u3001\u7cfb\u7edf\u8bbe\u8ba1\u3001I\/O \u6027\u80fd\u4f18\u5316\u6280\u672f\uff0c\u4ee5\u53ca\u5728\u5b58\u50a8\u6027\u80fd\u548c\u8bfb\u53d6\u6027\u80fd\u6d4b\u8bd5\u7684\u5b9e\u9a8c\u7ed3\u679c\u3002<\/p>\n<\/section>\n<\/blockquote>\n<p>Meta \u5b98\u65b9\u6700\u8fd1\u62ab\u9732\u4e86\u5728 16384 \u5757 H100 80GB \u8bad\u7ec3\u96c6\u7fa4\u4e0a\u8fdb\u884c Llama3 405B \u8bad\u7ec3\u7684\u6545\u969c\u7387 \u2014\u2014 \u77ed\u77ed 54 \u5929\uff0c\u53d1\u751f 419 \u6b21\u4e2d\u65ad\uff0c\u5e73\u5747\u6bcf\u4e09\u5c0f\u65f6\u5d29\u6e83\u4e00\u6b21\uff0c\u5f15\u6765\u4e0d\u5c11\u4ece\u4e1a\u8005\u5173\u6ce8\u3002<\/p>\n<p>\u6b63\u5982\u4e1a\u5185\u4e00\u53e5\u5e38\u8a00\uff0c\u5927\u578b\u8bad\u7ec3\u7cfb\u7edf\u552f\u4e00\u786e\u5b9a\u7684\uff0c\u4fbf\u662f\u8f6f\u786c\u4ef6\u6545\u969c\u3002\u968f\u7740\u8bad\u7ec3\u89c4\u6a21\u4e0e\u6a21\u578b\u5927\u5c0f\u7684\u65e5\u76ca\u589e\u957f\uff0c\u514b\u670d\u8f6f\u786c\u4ef6\u6545\u969c\uff0c\u63d0\u9ad8\u8bad\u7ec3\u6548\u7387\u6210\u4e3a\u5927\u6a21\u578b\u8fed\u4ee3\u7684\u91cd\u8981\u5f71\u54cd\u8981\u7d20\u3002<\/p>\n<p>Checkpoint 
\u5df2\u6210\u4e3a\u8bad\u7ec3\u63d0\u6548\u5173\u952e\u3002\u5728 Llama \u8bad\u7ec3\u62a5\u544a\u4e2d\uff0c\u6280\u672f\u56e2\u961f\u63d0\u5230\uff0c\u4e3a\u4e86\u5bf9\u6297\u9ad8\u6545\u969c\u7387\uff0c\u9700\u8981\u5728\u8bad\u7ec3\u8fc7\u7a0b\u4e2d\u9891\u7e41\u5730\u8fdb\u884c Checkpoint \uff0c\u4fdd\u5b58\u8bad\u7ec3\u4e2d\u7684\u6a21\u578b\u3001<mark data-type=\"concepts\" data-id=\"fa50298e-1a85-4af0-ae96-a82708f4b610\">\u4f18\u5316\u5668<\/mark>\u3001\u6570\u636e\u8bfb\u53d6\u5668\u72b6\u6001\uff0c\u51cf\u5c11\u8bad\u7ec3\u8fdb\u5ea6\u635f\u5931\u3002<\/p>\n<p><strong><mark data-type=\"institutions\" data-id=\"7092494f-e4a9-4175-8efe-b5ddb66a9878\">\u5b57\u8282\u8df3\u52a8<\/mark>\u8c46\u5305\u5927\u6a21\u578b\u56e2\u961f\u4e0e\u6e2f\u5927\u8fd1\u671f\u516c\u5f00\u4e86\u6210\u679c \u2014\u2014 ByteCheckpoint \uff0c\u4e00\u4e2a PyTorch \u539f\u751f\uff0c\u517c\u5bb9\u591a\u4e2a\u8bad\u7ec3\u6846\u67b6\uff0c\u652f\u6301 Checkpoint \u7684\u9ad8\u6548\u8bfb\u5199\u548c\u81ea\u52a8\u91cd\u65b0\u5207\u5206\u7684\u5927\u6a21\u578b Checkpointing \u7cfb\u7edf\u3002<\/strong><\/p>\n<p><strong>\u4e0e\u57fa\u7ebf\u65b9\u6cd5\u76f8\u6bd4\uff0cByteCheckpoint \u5728 Checkpoint \u4fdd\u5b58\u4e0a\u6027\u80fd\u63d0\u5347\u9ad8\u8fbe 529.22 \u500d\uff0c\u5728\u52a0\u8f7d\u4e0a\uff0c\u6027\u80fd\u63d0\u5347\u9ad8\u8fbe 3.51 \u500d\u3002<\/strong>\u6781\u7b80\u7684\u7528\u6237\u63a5\u53e3\u548c Checkpoint \u81ea\u52a8\u91cd\u65b0\u5207\u5206\u529f\u80fd\uff0c\u663e\u8457\u964d\u4f4e\u4e86\u7528\u6237\u4e0a\u624b\u548c\u4f7f\u7528\u6210\u672c\uff0c\u63d0\u9ad8\u4e86\u7cfb\u7edf\u7684\u6613\u7528\u6027\u3002<\/p>\n<section><strong>\u76ee\u524d\u8bba\u6587\u6210\u679c\u5df2\u5bf9\u5916\u516c\u5f00<\/strong>\u3002<\/section>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-d9f08060ac50dd1443252f63d2b30c0c.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" 
src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-d9f08060ac50dd1443252f63d2b30c0c.png\"><\/a><\/p>\n<ul>\n<li>\n<section>ByteCheckpoint: A Unified Checkpointing System for LLM Development<\/section>\n<\/li>\n<li>\n<section>\u8bba\u6587\u94fe\u63a5\uff1ahttps:\/\/team.doubao.com\/zh\/publication\/bytecheckpoint-a-unified-checkpointing-system-for-llm-development?view_from=research<\/section>\n<\/li>\n<\/ul>\n<section><\/section>\n<section><strong>Checkpoint \u6280\u672f\u5728\u5927\u6a21\u578b\u8bad\u7ec3\u4e2d\u7684\u6280\u672f\u6311\u6218\u00a0<\/strong><\/section>\n<section><\/section>\n<section>\u5f53\u524d Checkpoint \u76f8\u5173\u6280\u672f\u5728\u652f\u6301\u5927\u6a21\u578b\u8bad\u7ec3\u63d0\u6548\u4e2d\uff0c\u5171\u9762\u4e34\u56db\u4e2a\u65b9\u9762\u6311\u6218\uff1a<\/section>\n<section><\/section>\n<ul>\n<li>\n<section><strong>\u73b0\u6709\u7cfb\u7edf\u8bbe\u8ba1\u5b58\u5728\u7f3a\u9677\uff0c\u663e\u8457\u589e\u52a0\u8bad\u7ec3\u989d\u5916 I\/O \u5f00\u9500<\/strong><\/section>\n<\/li>\n<\/ul>\n<section><\/section>\n<section>\u5728\u8bad\u7ec3\u5de5\u4e1a\u7ea7\u522b\u7684\u5927<mark data-type=\"tech_tasks\" data-id=\"bf35ef94-d956-4033-a533-0c0828308c36\">\u8bed\u8a00\u6a21\u578b<\/mark> (LLM) \u7684\u8fc7\u7a0b\u4e2d\uff0c\u8bad\u7ec3\u72b6\u6001\u9700\u8981\u901a\u8fc7\u68c0\u67e5\u70b9\u6280\u672f ( Checkpointing ) \u8fdb\u884c\u4fdd\u5b58\u548c\u6301\u4e45\u5316\u3002\u901a\u5e38\u60c5\u51b5\u4e0b\uff0c\u4e00\u4e2a Checkpoint \u5305\u62ec 5 \u4e2a\u90e8\u5206 (\u6a21\u578b\uff0c<mark data-type=\"concepts\" 
data-id=\"fa50298e-1a85-4af0-ae96-a82708f4b610\">\u4f18\u5316\u5668<\/mark>\uff0c\u6570\u636e\u8bfb\u53d6\u5668\uff0c\u968f\u673a\u6570\u548c\u7528\u6237\u81ea\u5b9a\u4e49\u914d\u7f6e)\u3002\u8fd9\u4e00\u8fc7\u7a0b\u5f80\u5f80\u4f1a\u7ed9\u8bad\u7ec3\u5e26\u6765\u5206\u949f\u7ea7\u522b\u7684\u963b\u585e\uff0c\u4e25\u91cd\u5f71\u54cd\u8bad\u7ec3\u6548\u7387\u3002<\/section>\n<section><\/section>\n<section>\u5728\u4f7f\u7528\u8fdc\u7a0b\u6301\u4e45\u5316\u5b58\u50a8\u7cfb\u7edf\u7684\u5927\u89c4\u6a21\u8bad\u7ec3\u573a\u666f\u4e0b\uff0c\u73b0\u6709\u7684 Checkpointing \u7cfb\u7edf\u6ca1\u6709\u5145\u5206\u5229\u7528 Checkpoint \u4fdd\u5b58\u8fc7\u7a0b\u4e2d GPU \u5230 CPU \u5185\u5b58\u62f7\u8d1d ( D2H \u590d\u5236)\uff0c\u5e8f\u5217\u5316\uff0c\u672c\u5730\u5b58\u76d8\uff0c\u4e0a\u4f20\u5230\u5b58\u50a8\u7cfb\u7edf\u5404\u4e2a\u9636\u6bb5\u7684\u6267\u884c\u72ec\u7acb\u6027\u3002<\/section>\n<section><\/section>\n<section>\u6b64\u5916\uff0c\u4e0d\u540c\u8bad\u7ec3\u8fdb\u7a0b\u5171\u540c\u5206\u62c5 Checkpoint \u5b58\u53d6\u4efb\u52a1\u7684\u5e76\u884c\u5904\u7406\u6f5c\u529b\u4e5f\u6ca1\u6709\u88ab\u5145\u5206\u53d1\u6398\u3002\u8fd9\u4e9b\u7cfb\u7edf\u8bbe\u8ba1\u4e0a\u7684\u4e0d\u8db3\u589e\u52a0\u4e86 Checkpoint \u8bad\u7ec3\u5e26\u6765\u7684\u989d\u5916 I\/O \u5f00\u9500\u3002<\/section>\n<section><\/section>\n<ul>\n<li>\n<section><strong>Checkpoint \u91cd\u65b0\u5207\u5206\u56f0\u96be\uff0c\u624b\u52a8\u5207\u5206\u811a\u672c\u5f00\u53d1\u7ef4\u62a4\u5f00\u9500\u8fc7\u9ad8<\/strong><\/section>\n<\/li>\n<\/ul>\n<section><\/section>\n<section>\u5728 LLM \u7684\u4e0d\u540c\u8bad\u7ec3\u9636\u6bb5 (\u9884\u8bad\u7ec3\u5230 SFT \u6216\u8005 RLHF ) \u4ee5\u53ca\u4e0d\u540c\u4efb\u52a1 (\u4ece\u8bad\u7ec3\u4efb\u52a1\u62c9\u53d6\u4e0d\u540c\u9636\u6bb5\u7684 Checkpoint \u8fdb\u884c\u6267\u884c\u81ea\u52a8\u8bc4\u4f30) \u4e4b\u95f4\u8fdb\u884c Checkpoint 
\u8fc1\u79fb\u65f6\uff0c\u901a\u5e38\u9700\u8981\u5bf9\u4fdd\u5b58\u5728\u6301\u4e45\u5316\u5b58\u50a8\u7cfb\u7edf\u4e2d\u7684 Checkpoint \u8fdb\u884c\u91cd\u65b0\u5207\u5206 ( Checkpoint Resharding ) \uff0c\u4ee5\u9002\u5e94\u4e0b\u6e38\u4efb\u52a1\u7684\u65b0\u5e76\u884c\u5ea6\u914d\u7f6e\u4ee5\u53ca\u53ef\u7528 GPU \u8d44\u6e90\u7684\u914d\u989d\u3002<\/section>\n<section><\/section>\n<section>\u73b0\u6709 Checkpointing \u7cfb\u7edf [1, 2, 3, 4] \u90fd\u5047\u8bbe\u5b58\u50a8\u548c\u52a0\u8f7d\u65f6\uff0c\u5e76\u884c\u5ea6\u914d\u7f6e\u548c GPU \u8d44\u6e90\u4fdd\u6301\u4e0d\u53d8\uff0c\u65e0\u6cd5\u5904\u7406 Checkpoint \u91cd\u65b0\u5207\u5206\u7684\u9700\u6c42\u3002\u5de5\u4e1a\u754c\u76ee\u524d\u5e38\u89c1\u7684\u89e3\u51b3\u529e\u6cd5\u662f \u2014\u2014 \u4e3a\u4e0d\u540c\u6a21\u578b\u5b9a\u5236 Checkpoint \u5408\u5e76\u6216\u8005\u91cd\u65b0\u5207\u5206\u811a\u672c\u3002\u8fd9\u79cd\u65b9\u6cd5\u5e26\u6765\u4e86\u5927\u91cf\u5f00\u53d1\u4e0e\u7ef4\u62a4\u5f00\u9500\uff0c\u53ef\u6269\u5c55\u6027\u8f83\u5dee\u3002<\/section>\n<section><\/section>\n<ul>\n<li>\n<section><strong>\u4e0d\u540c\u7684\u8bad\u7ec3\u6846\u67b6 Checkpoint \u6a21\u5757\u5272\u88c2\uff0c\u4e3a Checkpoint \u7edf\u4e00\u7ba1\u7406\u548c\u6027\u80fd\u4f18\u5316\u5e26\u6765\u6311\u6218<\/strong><\/section>\n<\/li>\n<\/ul>\n<section><\/section>\n<section>\u5728\u5de5\u4e1a\u754c\u7684\u8bad\u7ec3\u5e73\u53f0\u4e0a\uff0c\u5de5\u7a0b\u5e08\u4e0e\u79d1\u5b66\u5bb6\u5f80\u5f80\u4f1a\u6839\u636e\u4efb\u52a1\u7279\u6027\uff0c\u9009\u62e9\u5408\u9002\u6846\u67b6 (Megatron-LM [5], FSDP [6], DeepSpeed [7], veScale [8, 9]) \u8fdb\u884c\u8bad\u7ec3\uff0c\u5e76\u4fdd\u5b58 Checkpoint \u5230\u5b58\u50a8\u7cfb\u7edf\u3002\u7136\u800c\uff0c\u8fd9\u4e9b\u4e0d\u540c\u7684\u8bad\u7ec3\u6846\u67b6\u90fd\u5177\u6709\u81ea\u5df1\u72ec\u7acb\u7684 Checkpoint \u683c\u5f0f\u4ee5\u53ca\u8bfb\u5199\u6a21\u5757\u3002\u4e0d\u540c\u8bad\u7ec3\u6846\u67b6\u7684 Checkpoint 
\u6a21\u5757\u8bbe\u8ba1\u4e0d\u5c3d\u76f8\u540c\uff0c\u4e3a\u5e95\u5c42\u7cfb\u7edf\u8fdb\u884c\u7edf\u4e00\u7684 Checkpoint \u7ba1\u7406\u4ee5\u53ca\u6027\u80fd\u4f18\u5316\u5e26\u6765\u4e86\u6311\u6218\u3002<\/section>\n<section><\/section>\n<ul>\n<li>\n<section><strong>\u5206\u5e03\u5f0f\u8bad\u7ec3\u7cfb\u7edf\u7684\u7528\u6237\u9762\u4e34\u591a\u91cd\u56f0\u6270<\/strong><\/section>\n<\/li>\n<\/ul>\n<section><\/section>\n<section>\u4ece\u8bad\u7ec3\u7cfb\u7edf\u7684\u7528\u6237\uff08 AI \u7814\u7a76\u79d1\u5b66\u5bb6\u6216\u5de5\u7a0b\u5e08\uff09\u7684\u89d2\u5ea6\u51fa\u53d1\uff0c\u7528\u6237\u4f7f\u7528\u5206\u5e03\u5f0f\u8bad\u7ec3\u7cfb\u7edf\u65f6\uff0c\u5728 Checkpoint \u65b9\u5411\u5f80\u5f80\u4f1a\u88ab\u4e09\u4e2a\u95ee\u9898\u56f0\u6270\uff1a<\/section>\n<section><\/section>\n<section>1\uff09\u5982\u4f55\u9ad8\u6548\u5730\u5b58\u50a8 Checkpoint \uff0c\u5728\u4e0d\u5f71\u54cd\u8bad\u7ec3\u6548\u7387\u7684\u60c5\u51b5\u4e0b\u4fdd\u5b58 Checkpoint\u3002<\/section>\n<section>2\uff09\u5982\u4f55\u91cd\u65b0\u5207\u5206 Checkpoint \uff0c\u5bf9\u4e8e\u5728\u4e00\u4e2a\u5e76\u884c\u5ea6\u4e0b\u5b58\u50a8\u7684 Checkpoint \uff0c\u6839\u636e\u65b0\u7684\u5e76\u884c\u5ea6\u6b63\u786e\u8bfb\u5165\u3002<\/section>\n<section>3\uff09\u5982\u4f55\u628a\u8bad\u7ec3\u5f97\u5230\u7684\u4ea7\u7269\u4e0a\u4f20\u5230\u4e91\u5b58\u50a8\u7cfb\u7edf\u4e0a\uff08 HDFS\uff0cS3 \u7b49\uff09\uff0c\u624b\u52a8\u7ba1\u7406\u591a\u4e2a\u5b58\u50a8\u7cfb\u7edf\uff0c\u5bf9\u7528\u6237\u6765\u8bf4\u5b66\u4e60\u548c\u4f7f\u7528\u6210\u672c\u8f83\u9ad8\u3002<\/section>\n<section><\/section>\n<section><strong>\u9488\u5bf9\u4e0a\u8ff0\u95ee\u9898\uff0c<mark data-type=\"institutions\" data-id=\"7092494f-e4a9-4175-8efe-b5ddb66a9878\">\u5b57\u8282\u8df3\u52a8<\/mark>\u8c46\u5305\u5927\u6a21\u578b\u56e2\u961f\u548c\u9999\u6e2f\u5927\u5b66\u5434\u5ddd\u6559\u6388\u5b9e\u9a8c\u5ba4\u8054\u5408\u63a8\u51fa\u4e86 ByteCheckpoint 
\u3002<\/strong><\/section>\n<section><\/section>\n<section>ByteCheckpoint \u662f\u4e00\u4e2a\u591a\u8bad\u7ec3\u6846\u67b6\u7edf\u4e00\uff0c\u652f\u6301\u591a\u5b58\u50a8\u540e\u7aef\uff0c\u5177\u5907\u81ea\u52a8 Checkpoint \u91cd\u65b0\u5207\u5206\u80fd\u529b\u7684\u9ad8\u6027\u80fd\u5206\u5e03\u5f0f Checkpointing \u7cfb\u7edf\u3002ByteCheckpoint \u63d0\u4f9b\u4e86\u7b80\u5355\u6613\u7528\u7684\u7528\u6237\u63a5\u53e3 \uff0c\u5b9e\u73b0\u4e86\u5927\u91cf I\/O \u6027\u80fd\u4f18\u5316\u6280\u672f\u63d0\u9ad8\u4e86\u5b58\u50a8\u548c\u8bfb\u53d6 Checkpoint \u6027\u80fd\uff0c\u5e76\u652f\u6301 Checkpoint \u5728\u4e0d\u540c\u5e76\u884c\u5ea6\u914d\u7f6e\u7684\u4efb\u52a1\u4e2d\u7684\u7075\u6d3b\u8fc1\u79fb\u3002<\/section>\n<section><\/section>\n<section><strong>\u7cfb\u7edf\u8bbe\u8ba1<\/strong><\/section>\n<section><\/section>\n<section><strong>\u5b58\u50a8\u67b6\u6784<\/strong><\/section>\n<section><\/section>\n<section>ByteCheckpoint \u91c7\u7528\u4e86\u5143\u6570\u636e \/ <mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u6570\u636e\u5206\u79bb\u7684\u5b58\u50a8\u67b6\u6784\uff0c\u5b9e\u73b0\u4e86 Checkpoint \u7ba1\u7406\u4e0e\u8bad\u7ec3\u6846\u67b6\u548c\u5e76\u884c\u5ea6\u7684\u89e3\u8026\u5408\u3002<\/section>\n<section><\/section>\n<section>\u4e0d\u540c\u8bad\u7ec3\u6846\u67b6\u4e2d\u7684\u6a21\u578b\u4ee5\u53ca<mark data-type=\"concepts\" data-id=\"fa50298e-1a85-4af0-ae96-a82708f4b610\">\u4f18\u5316\u5668<\/mark>\u7684<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u5207\u7247 ( Tensor Shard) \u00a0\u5b58\u50a8\u5728 storage \u6587\u4ef6\u4e2d\uff0c\u5143\u4fe1\u606f (TensorMeta, ShardMeta, ByteMeta) \u5b58\u50a8\u5230\u5168\u5c40\u552f\u4e00\u7684 metadata \u6587\u4ef6\u4e2d\u3002<\/section>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-b42c73d2c342ecebf2ef7e06560c9751.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img 
decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-b42c73d2c342ecebf2ef7e06560c9751.png\"><\/a><\/p>\n<section>\u5f53\u4f7f\u7528\u4e0d\u540c\u7684\u5e76\u884c\u5ea6\u914d\u7f6e\u8bfb\u53d6 Checkpoint \u65f6\uff0c\u5982\u4e0b\u56fe\u6240\u793a\uff0c\u6bcf\u4e2a\u8bad\u7ec3\u8fdb\u7a0b\u53ea\u9700\u8981\u6839\u636e\u5f53\u524d\u7684\u5e76\u884c\u5ea6\u8bbe\u7f6e<mark data-type=\"concepts\" data-id=\"bf740558-f0f7-41a8-87a0-e695a97563b3\">\u67e5\u8be2<\/mark>\u5143\u4fe1\u606f\uff0c\u4fbf\u80fd\u591f\u83b7\u53d6\u8fdb\u7a0b\u6240\u9700\u8981<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u7684\u5b58\u50a8\u4f4d\u7f6e\uff0c\u518d\u6839\u636e\u4f4d\u7f6e\u76f4\u63a5\u8bfb\u53d6\uff0c\u5b9e\u73b0\u81ea\u52a8 Checkpoint \u91cd\u65b0\u5207\u5206\u3002<\/section>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-5d51fc0370bbc452ff64697114f2e764.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-5d51fc0370bbc452ff64697114f2e764.png\"><\/a><\/p>\n<section><strong>\u5de7\u89e3\u4e0d\u89c4\u5219<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u5207\u5206<\/strong><\/section>\n<section><\/section>\n<section>\u4e0d\u540c\u8bad\u7ec3\u6846\u67b6\u5728\u8fd0\u884c\u65f6\uff0c\u5f80\u5f80\u4f1a\u628a\u6a21\u578b\u6216\u8005<mark data-type=\"concepts\" data-id=\"fa50298e-1a85-4af0-ae96-a82708f4b610\">\u4f18\u5316\u5668<\/mark>\u4e2d<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u7684\u5f62\u72b6\u644a\u5e73 ( Flatten ) \u6210\u4e00\u7ef4\uff0c\u4ece\u800c\u63d0\u9ad8\u96c6\u5408\u901a\u4fe1\u6027\u80fd\u3002\u8fd9\u79cd\u644a\u5e73\u64cd\u4f5c\u7ed9 Checkpoint \u5b58\u50a8\u5e26\u6765\u4e86\u4e0d\u89c4\u5219<mark data-type=\"concepts\" 
data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u5207\u5206 \u00a0(Irregular Tensor Sharding) \u00a0\u7684\u6311\u6218\u3002<\/section>\n<section><\/section>\n<section>\u5982\u4e0b\u56fe\u6240\u793a\uff0c\u5728 Megatron-LM \u00a0(\u7531 NVIDIA \u7814\u53d1\u7684\u5206\u5e03\u5f0f\u5927\u6a21\u578b\u8bad\u7ec3\u6846\u67b6) \u548c veScale \u00a0(\u7531<mark data-type=\"institutions\" data-id=\"7092494f-e4a9-4175-8efe-b5ddb66a9878\">\u5b57\u8282\u8df3\u52a8<\/mark>\u7814\u53d1\u7684 PyTorch \u539f\u751f\u5206\u5e03\u5f0f\u5927\u6a21\u578b\u8bad\u7ec3\u6846\u67b6) \u4e2d\uff0c\u6a21\u578b<mark data-type=\"concepts\" data-id=\"2e982b73-88e2-41e8-a430-f7ae5a9af4bf\">\u53c2\u6570<\/mark>\u5bf9\u5e94\u7684<mark data-type=\"concepts\" data-id=\"fa50298e-1a85-4af0-ae96-a82708f4b610\">\u4f18\u5316\u5668<\/mark>\u72b6\u6001\u4f1a\u88ab\u5c55\u5e73\u4e3a\u4e00\u7ef4\u540e\u5408\u5e76\uff0c\u518d\u6839\u636e\u6570\u636e\u5e76\u884c\u5ea6\u5207\u5206\u3002\u8fd9\u5bfc\u81f4<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u88ab\u4e0d\u89c4\u5219\u5730\u5207\u5206\u5230\u4e0d\u540c\u8fdb\u7a0b\u4e4b\u4e2d\uff0c<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u5207\u7247\u7684\u5143\u4fe1\u606f\u65e0\u6cd5\u4f7f\u7528\u504f\u79fb\u91cf\u548c\u957f\u5ea6\u5143\u7ec4\u6765\u8868\u793a\uff0c\u7ed9\u5b58\u50a8\u548c\u8bfb\u53d6\u5e26\u6765\u56f0\u96be\u3002<\/section>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-99d6b2d3b74d024ddd918a54272b4662.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-99d6b2d3b74d024ddd918a54272b4662.png\"><\/a><\/p>\n<section>\u4e0d\u89c4\u5219<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u5207\u5206\u7684\u95ee\u9898\u5728 FSDP 
\u6846\u67b6\u4e2d\u4e5f\u540c\u6837\u5b58\u5728\u3002<\/section>\n<section><\/section>\n<section>\u4e3a\u6d88\u9664\u4e0d\u89c4\u5219\u5207\u5206\u7684<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u5207\u7247 \uff0cFSDP \u6846\u67b6\u5728\u5b58\u50a8 Checkpoint \u4e4b\u524d\u4f1a\u5728\u6240\u6709\u8fdb\u7a0b\u4e0a\u5bf9\u4e00\u7ef4<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u5207\u7247\u8fdb\u884c all-gather \u96c6\u5408\u901a\u4fe1\u4ee5\u53ca D2H \u590d\u5236\u64cd\u4f5c\uff0c\u4ee5\u83b7\u53d6\u5b8c\u6574\u4e0d\u89c4\u5219\u5207\u5206\u7684<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u3002\u8fd9\u79cd\u65b9\u6848\u5e26\u6765\u4e86\u6781\u5927\u7684\u901a\u4fe1\u548c\u9891\u7e41\u7684 GPU-CPU \u540c\u6b65\u5f00\u9500\uff0c\u4e25\u91cd\u5f71\u54cd\u4e86 Checkpoint \u5b58\u50a8\u7684\u6027\u80fd\u3002<\/section>\n<section><\/section>\n<section>\u9488\u5bf9\u8fd9\u4e2a\u95ee\u9898\uff0cByteCheckpoint \u63d0\u51fa\u4e86\u5f02\u6b65<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u5408\u5e76 \u00a0(Asynchronous Tensor Merging) \u00a0\u6280\u672f\u3002<\/section>\n<section><\/section>\n<section>ByteCheckpoint \u9996\u5148\u627e\u51fa\u4e0d\u540c\u8fdb\u7a0b\u4e2d\u88ab\u4e0d\u89c4\u5219\u5207\u5206\u7684<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\uff0c\u4e4b\u540e\u91c7\u7528\u5f02\u6b65\u7684 P2P \u901a\u4fe1\uff0c\u628a\u8fd9\u4e9b\u4e0d\u89c4\u5219\u7684<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u5206\u914d\u5230\u4e0d\u540c\u8fdb\u7a0b\u4e0a\u8fdb\u884c\u5408\u5e76\u3002\u6240\u6709\u9488\u5bf9\u8fd9\u4e9b\u4e0d\u89c4\u5219<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u7684 P2P 
\u901a\u4fe1\u7b49\u5f85\uff08Wait\uff09 \u4ee5\u53ca<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark> D2H \u590d\u5236\u64cd\u4f5c\u88ab\u63a8\u8fdf\u5230\u5b83\u4eec\u5373\u5c06\u8fdb\u5165\u5e8f\u5217\u5316\u9636\u6bb5\u7684\u65f6\u5019\uff0c\u4ece\u800c\u6d88\u9664\u4e86\u9891\u7e41\u7684\u540c\u6b65\u5f00\u9500\uff0c\u4e5f\u589e\u52a0\u4e86\u901a\u4fe1\u4e0e\u5176\u4ed6 Checkpoint \u5b58\u50a8\u6d41\u7a0b\u7684\u6267\u884c\u91cd\u53e0\u5ea6\u3002<\/section>\n<section><\/section>\n<section><strong>\u7cfb\u7edf\u67b6\u6784<\/strong><\/section>\n<section><\/section>\n<section>\u4e0b\u56fe\u5c55\u793a\u4e86 ByteCheckpoint \u7684\u7cfb\u7edf\u67b6\u6784\uff1a<\/section>\n<section><\/section>\n<section>\u00a0API \u5c42\u4e3a\u4e0d\u540c\u8bad\u7ec3\u6846\u67b6\u63d0\u4f9b\u4e86\u7b80\u5355\uff0c\u6613\u7528\u4e14\u7edf\u4e00\u7684\u5199\u5165\uff08 Save \uff09\u548c\u8bfb\u53d6\uff08 Load \uff09\u63a5\u53e3\u3002<\/section>\n<section><\/section>\n<section>Planner \u5c42\u4f1a\u6839\u636e\u5b58\u53d6\u5bf9\u8c61\u4e3a\u4e0d\u540c\u8bad\u7ec3\u8fdb\u7a0b\u751f\u6210\u5b58\u53d6\u65b9\u6848\uff0c\u4ea4\u7531 Execution \u5c42\u6267\u884c\u5b9e\u9645\u7684 I\/O \u4efb\u52a1\u3002<\/section>\n<section><\/section>\n<section>Execution \u5c42\u6267\u884c I\/O \u4efb\u52a1\u5e76\u4e0e Storage \u5c42\u8fdb\u884c\u4ea4\u4e92\uff0c\u5229\u7528\u5404\u79cd I\/O \u4f18\u5316\u6280\u672f\u8fdb\u884c\u9ad8\u6027\u80fd\u7684 Checkpoint \u5b58\u53d6\u3002<\/section>\n<section><\/section>\n<section>Storage \u5c42\u7ba1\u7406\u4e0d\u540c\u7684\u5b58\u50a8\u540e\u7aef\uff0c\u5e76\u5728 I\/O 
\u4efb\u52a1\u8fc7\u7a0b\u4e2d\u6839\u636e\u4e0d\u540c\u5b58\u50a8\u540e\u7aef\u8fdb\u884c\u76f8\u5e94\u7684\u4f18\u5316\u3002<\/section>\n<section><\/section>\n<section>\u5206\u5c42\u8bbe\u8ba1\u589e\u5f3a\u4e86\u7cfb\u7edf\u7684\u53ef\u6269\u5c55\u6027\uff0c\u4ee5\u4fbf\u672a\u6765\u652f\u6301\u66f4\u591a\u7684\u8bad\u7ec3\u6846\u67b6\u548c\u5b58\u50a8\u540e\u7aef\u3002<\/section>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-53820fd137df2c2e79d86606ec0e4709.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-53820fd137df2c2e79d86606ec0e4709.png\"><\/a><\/p>\n<section><strong>API \u7528\u4f8b<\/strong><\/section>\n<section><\/section>\n<section>ByteCheckpoint \u7684 API \u7528\u4f8b\u5982\u4e0b\uff1a<\/section>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-099fce6c26eddbe8abdbbaff83209ecd.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-099fce6c26eddbe8abdbbaff83209ecd.png\"><\/a><\/p>\n<section>ByteCheckpoint \u63d0\u4f9b\u4e86\u6781\u7b80 API \uff0c\u964d\u4f4e\u4e86\u7528\u6237\u4e0a\u624b\u7684\u6210\u672c\u3002\u7528\u6237\u5728\u5b58\u50a8\u548c\u8bfb\u53d6 Checkpoint \u65f6\uff0c\u53ea\u9700\u8981\u8c03\u7528\u5b58\u50a8\u548c\u52a0\u8f7d\u51fd\u6570\uff0c\u4f20\u5165\u9700\u8981\u5b58\u50a8\u548c\u8bfb\u53d6\u7684\u5185\u5bb9\uff0c\u6587\u4ef6\u7cfb\u7edf\u8def\u5f84\u548c\u5404\u79cd\u6027\u80fd\u4f18\u5316\u9009\u9879\u3002<\/section>\n<section><\/section>\n<section><strong>I\/O \u6027\u80fd\u4f18\u5316\u6280\u672f<\/strong><\/section>\n<section><\/section>\n<section><strong>Checkpoint \u5b58\u50a8\u4f18\u5316<\/strong><\/section>\n<section><\/section>\n<section>\u6d41\u6c34\u7ebf\u6267\u884c<\/section>\n<section><\/section>\n<section>\u5982\u4e0b\u56fe\u6240\u793a\uff0cByteCheckpoint 
\u8bbe\u8ba1\u4e86\u5168\u5f02\u6b65\u7684\u5b58\u50a8\u6d41\u6c34\u7ebf\uff08Save Pipeline\uff09\uff0c\u5c06 Checkpoint \u5b58\u50a8\u7684\u4e0d\u540c\u9636\u6bb5\uff08P2P <mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u4f20\u8f93\uff0cD2H \u590d\u5236\uff0c\u5e8f\u5217\u5316\uff0c\u4fdd\u5b58\u672c\u5730\u548c\u4e0a\u4f20\u6587\u4ef6\u7cfb\u7edf\uff09\u8fdb\u884c\u62c6\u5206\uff0c\u5b9e\u73b0\u9ad8\u6548\u7684\u6d41\u6c34\u7ebf\u6267\u884c\u3002<\/section>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-d1f3b0e763ec709faff34f67546429c1.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-d1f3b0e763ec709faff34f67546429c1.png\"><\/a><\/p>\n<section>\u907f\u514d\u5185\u5b58\u91cd\u590d\u5206\u914d<\/section>\n<section><\/section>\n<section>\u5728 D2H \u590d\u5236\u8fc7\u7a0b\uff0cByteCheckpoint \u91c7\u7528\u56fa\u5b9a\u5185\u5b58\u6c60\uff08 Pinned Memory Pool \uff09\uff0c\u51cf\u5c11\u4e86\u5185\u5b58\u53cd\u590d\u5206\u914d\u7684\u65f6\u95f4\u5f00\u9500\u3002<\/section>\n<section><\/section>\n<section>\u9664\u6b64\u4e4b\u5916\uff0c\u4e3a\u4e86\u964d\u4f4e\u9ad8\u9891\u5b58\u50a8\u573a\u666f\u4e2d\u56e0\u4e3a\u540c\u6b65\u7b49\u5f85\u56fa\u5b9a\u5185\u5b58\u6c60\u56de\u6536\u800c\u5e26\u6765\u7684\u989d\u5916\u65f6\u95f4\u5f00\u9500\uff0cByteCheckpoint \u5728\u56fa\u5b9a\u5185\u5b58\u6c60\u7684\u57fa\u7840\u4e0a\u52a0\u5165\u4e86 Ping-Pong buffering \u7684\u673a\u5236\u3002\u4e24\u4e2a\u72ec\u7acb\u7684\u5185\u5b58\u6c60\u4ea4\u66ff\u626e\u6f14\u7740\u8bfb\u5199 buffer \u7684\u89d2\u8272\uff0c\u4e0e GPU \u548c\u6267\u884c\u540e\u7eed I\/O \u64cd\u4f5c\u7684 I\/O workers \u8fdb\u884c\u4ea4\u4e92\uff0c\u8fdb\u4e00\u6b65\u63d0\u5347\u5b58\u50a8\u6548\u7387\u3002<\/section>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-47db15be5bd3b6083410509da601bd82.png\" 
data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-47db15be5bd3b6083410509da601bd82.png\"><\/a><\/p>\n<section>\u8d1f\u8f7d\u5747\u8861<\/section>\n<section><\/section>\n<section>\u5728\u6570\u636e\u5e76\u884c ( Data-Parallel or DP ) \u8bad\u7ec3\u4e2d\uff0c\u6a21\u578b\u5728\u4e0d\u540c\u7684\u6570\u636e\u5e76\u884c\u8fdb\u7a0b\u7ec4\uff08 DP Group \uff09\u4e4b\u95f4\u662f\u5197\u4f59\u7684\uff0c ByteCheckpoint \u91c7\u7528\u4e86\u8d1f\u8f7d\u5747\u8861\u7b97\u6cd5\u628a\u5197\u4f59\u7684\u6a21\u578b<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u5747\u5300\u5206\u914d\u5230\u4e0d\u540c\u8fdb\u7a0b\u7ec4\u4e2d\u8fdb\u884c\u5b58\u50a8\uff0c\u6709\u6548\u5730\u63d0\u9ad8\u4e86 Checkpoint \u5b58\u50a8\u6548\u7387\u3002<\/section>\n<section><\/section>\n<section><strong>Checkpoint \u8bfb\u53d6\u4f18\u5316<\/strong><\/section>\n<section><strong><br \/><\/strong><\/section>\n<section>\u96f6\u5197\u4f59\u52a0\u8f7d<\/section>\n<section><\/section>\n<section>\u5982\u56fe\u6240\u793a\uff0c\u5728\u6539\u53d8\u5e76\u884c\u5ea6\u8bfb\u53d6 Checkpoint \u65f6\uff0c\u65b0\u7684\u8bad\u7ec3\u8fdb\u7a0b\u53ef\u80fd\u53ea\u9700\u8981\u4ece\u539f\u6765\u7684<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u5207\u7247\u4e2d\u8bfb\u53d6\u5176\u4e2d\u7684\u4e00\u90e8\u5206\u3002<\/section>\n<section><\/section>\n<section>ByteCheckpoint \u91c7\u7528\u6309\u9700\u90e8\u5206\u6587\u4ef6\u8bfb\u53d6\uff08 Partial File Reading \uff09 \u6280\u672f\uff0c\u76f4\u63a5\u4ece\u8fdc\u7a0b\u5b58\u50a8\u4e2d\u8bfb\u53d6\u9700\u8981\u7684\u6587\u4ef6\u7247\u6bb5\uff0c\u907f\u514d\u4e0b\u8f7d\u548c\u8bfb\u53d6\u4e0d\u5fc5\u8981\u7684\u6570\u636e\u3002<\/section>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-98c19ae70891127814b8d123c610cf76.png\" data-fancybox=\"images\" 
data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-98c19ae70891127814b8d123c610cf76.png\"><\/a><\/p>\n<section>\u5728\u6570\u636e\u5e76\u884c (Data-Parallel or DP) \u8bad\u7ec3\u4e2d\uff0c\u6a21\u578b\u5728\u4e0d\u540c\u7684\u6570\u636e\u5e76\u884c\u8fdb\u7a0b\u7ec4\uff08DP Group\uff09\u4e4b\u95f4\u662f\u5197\u4f59\u7684\uff0c\u4e0d\u540c\u8fdb\u7a0b\u7ec4\u4f1a\u91cd\u590d\u8bfb\u53d6\u540c\u4e00\u4e2a<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u5207\u7247\u3002\u5728\u5927\u89c4\u6a21\u8bad\u7ec3\u7684\u573a\u666f\u4e0b\uff0c\u4e0d\u540c\u8fdb\u7a0b\u7ec4\u540c\u65f6\u53d1\u7ed9\u8fdc\u7a0b\u6301\u4e45\u5316\u5b58\u50a8\u7cfb\u7edf \uff08\u6bd4\u5982 HDFS \uff09\u5927\u91cf\u8bf7\u6c42\uff0c\u4f1a\u7ed9\u5b58\u50a8\u7cfb\u7edf\u5e26\u6765\u5de8\u5927\u538b\u529b\u3002<\/section>\n<section><\/section>\n<section>\u4e3a\u4e86\u6d88\u9664\u91cd\u590d\u6570\u636e\u8bfb\u53d6\uff0c\u51cf\u5c11\u8bad\u7ec3\u8fdb\u7a0b\u53d1\u7ed9 HDFS \u7684\u8bf7\u6c42\uff0c\u4f18\u5316\u52a0\u8f7d\u7684\u6027\u80fd\uff0cByteCheckpoint \u628a\u76f8\u540c\u7684<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u5207\u7247\u8bfb\u53d6\u4efb\u52a1\u5747\u5300\u5206\u914d\u5230\u4e0d\u540c\u8fdb\u7a0b\u4e0a\uff0c\u5e76\u5728\u5bf9\u8fdc\u7a0b\u6587\u4ef6\u8fdb\u884c\u8bfb\u53d6\u7684\u540c\u65f6\uff0c\u5229\u7528 GPU \u4e4b\u95f4\u95f2\u7f6e\u7684\u5e26\u5bbd\u8fdb\u884c<mark data-type=\"concepts\" data-id=\"64cc669a-900a-449c-ac73-f71d0e91fc86\">\u5f20\u91cf<\/mark>\u5207\u7247\u4f20\u8f93\u3002<\/section>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-452a7a70d6f4eb5e620bb8fa62a02b26.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" 
src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-452a7a70d6f4eb5e620bb8fa62a02b26.png\"><\/a><\/p>\n<section><strong>\u5b9e\u9a8c\u7ed3\u679c<\/strong><\/section>\n<section><\/section>\n<section><strong>\u5b9e\u9a8c\u914d\u7f6e<\/strong><\/section>\n<section><\/section>\n<section>\u56e2\u961f\u4f7f\u7528 DenseGPT \u4e0e SparseGPT \u6a21\u578b (\u57fa\u4e8e GPT-3 [10] \u7ed3\u6784\u5b9e\u73b0)\uff0c\u5728\u4e0d\u540c\u6a21\u578b<mark data-type=\"concepts\" data-id=\"2e982b73-88e2-41e8-a430-f7ae5a9af4bf\">\u53c2\u6570<\/mark>\u91cf\uff0c\u4e0d\u540c\u8bad\u7ec3\u6846\u67b6\u548c\u4e0d\u540c\u89c4\u6a21\u7684\u8bad\u7ec3\u4efb\u52a1\u4e2d\u8bc4\u4f30\u4e86 ByteCheckpoint \u7684 Checkpoint \u5b58\u53d6\u6b63\u786e\u6027\u3001\u5b58\u50a8\u6027\u80fd\u548c\u8bfb\u53d6\u6027\u80fd\u3002\u66f4\u591a\u5b9e\u9a8c\u914d\u7f6e\u548c\u6b63\u786e\u6027\u6d4b\u8bd5\u7ec6\u8282\u8bf7\u79fb\u6b65\u5b8c\u6574\u8bba\u6587\u3002<\/section>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-eba019f5b2126c985028e680b16756c8.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-eba019f5b2126c985028e680b16756c8.png\"><\/a><\/p>\n<section><strong>\u5b58\u50a8\u6027\u80fd\u6d4b\u8bd5<\/strong><\/section>\n<section><strong><br \/><\/strong><\/section>\n<section>\u5728\u5b58\u50a8\u6027\u80fd\u6d4b\u8bd5\u4e2d\uff0c\u56e2\u961f\u6bd4\u8f83\u4e86\u4e0d\u540c\u6a21\u578b\u89c4\u6a21\u548c\u8bad\u7ec3\u6846\u67b6\uff0c\u5728\u8bad\u7ec3\u8fc7\u7a0b\u4e2d\u6bcf 50 \u6216\u8005 100 \u6b65\u5b58\u4e00\u6b21 Checkpoint \uff0c ByteCheckpoint \u548c\u57fa\u7ebf\uff08 Baseline \uff09\u65b9\u6cd5\u7ed9\u8bad\u7ec3\u5e26\u6765\u7684\u603b\u7684\u963b\u585e\u65f6\u95f4 ( Checkpoint stalls )\u3002<\/section>\n<section><\/section>\n<section>\u5f97\u76ca\u4e8e\u5bf9\u5199\u5165\u6027\u80fd\u7684\u6df1\u5ea6\u4f18\u5316\uff0cByteCheckpoint 
\u5728\u5404\u7c7b\u5b9e\u9a8c\u573a\u666f\u4e2d\u5747\u53d6\u5f97\u4e86\u5f88\u9ad8\u7684\u8868\u73b0\uff0c\u5728 576 \u5361 SparseGPT 110B &#8211; Megatron-LM \u8bad\u7ec3\u4efb\u52a1\u4e2d\u76f8\u6bd4\u57fa\u7ebf\u5b58\u50a8\u65b9\u6cd5\u53d6\u5f97\u4e86 66.65~74.55 \u500d\u7684\u6027\u80fd\u63d0\u5347\uff0c\u5728 256 \u5361 DenseGPT 10B &#8211; FSDP \u8bad\u7ec3\u4efb\u52a1\u4e2d\u751a\u81f3\u80fd\u8fbe\u5230 529.22 \u500d\u7684\u6027\u80fd\u63d0\u5347\u3002<\/section>\n<p><a href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-54cfb92828cf43f87e34c82d28ebbbe0.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-54cfb92828cf43f87e34c82d28ebbbe0.png\"><\/a><\/p>\n<section><strong>\u8bfb\u53d6\u6027\u80fd\u6d4b\u8bd5<\/strong><\/section>\n<section><\/section>\n<section>\u5728\u8bfb\u53d6\u6027\u80fd\u6d4b\u8bd5\u4e2d\uff0c\u56e2\u961f\u6bd4\u8f83\u4e0d\u540c\u65b9\u6cd5\u6839\u636e\u4e0b\u6e38\u4efb\u52a1\u5e76\u884c\u5ea6\u8bfb\u53d6 Checkpoint \u7684\u52a0\u8f7d\u65f6\u95f4\u3002ByteCheckpoint \u76f8\u6bd4\u57fa\u7ebf\u65b9\u6cd5\u53d6\u5f97\u4e86 1.55 \uff5e 3.37 \u500d\u7684\u6027\u80fd\u63d0\u5347\u3002<\/section>\n<section><\/section>\n<section>\u56e2\u961f\u89c2\u5bdf\u5230 ByteCheckpoint \u76f8\u5bf9\u4e8e Megatron-LM \u57fa\u7ebf\u65b9\u6cd5\u7684\u6027\u80fd\u63d0\u5347\u66f4\u4e3a\u663e\u8457\u3002\u8fd9\u662f\u56e0\u4e3a Megatron-LM \u5728\u8bfb\u53d6 Checkpoint \u5230\u65b0\u7684\u5e76\u884c\u5ea6\u914d\u7f6e\u4e4b\u524d\uff0c\u9700\u8981\u8fd0\u884c\u79bb\u7ebf\u7684\u811a\u672c\u5bf9\u5206\u5e03\u5f0f Checkpoint \u8fdb\u884c\u91cd\u65b0\u5206\u7247\u3002\u76f8\u6bd4\u4e4b\u4e0b\uff0cByteCheckpoint \u80fd\u591f\u76f4\u63a5\u8fdb\u884c\u81ea\u52a8 Checkpoint \u91cd\u65b0\u5207\u5206\uff0c\u65e0\u9700\u8fd0\u884c\u79bb\u7ebf\u811a\u672c\uff0c\u9ad8\u6548\u5b8c\u6210\u8bfb\u53d6\u3002<\/section>\n<p><a 
href=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-ba6616cca8fa465557164fb75d3bf1a3.png\" data-fancybox=\"images\" data-fancybox=\"gallery\"><img decoding=\"async\" src=\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-ba6616cca8fa465557164fb75d3bf1a3.png\"><\/a><\/p>\n<section>\u6700\u540e\uff0c\u5173\u4e8e ByteCheckpoint \u7684\u672a\u6765<mark data-type=\"tech_tasks\" data-id=\"3f5eac69-dad3-43e7-9022-40dcf97a1892\">\u89c4\u5212<\/mark>\uff0c\u56e2\u961f\u5e0c\u671b\u4ece\u4e24\u4e2a\u65b9\u9762\u7740\u624b\uff1a<\/section>\n<section><\/section>\n<section>\u5176\u4e00\uff0c\u5b9e\u73b0\u652f\u6301\u8d85\u5927\u89c4\u6a21 GPU \u96c6\u7fa4\u8bad\u7ec3\u4efb\u52a1\u9ad8\u6548 Checkpointing \u7684\u957f\u8fdc\u76ee\u6807\u3002<\/section>\n<section><\/section>\n<section>\u5176\u4e8c\uff0c\u5b9e\u73b0\u5927\u6a21\u578b\u8bad\u7ec3\u5168\u751f\u547d\u5468\u671f\u7684 Checkpoint \u7ba1\u7406\uff0c\u652f\u6301\u5168\u573a\u666f\u7684 Checkpoint \uff0c\u4ece\u9884\u8bad\u7ec3\uff08Pre-Training\uff09\uff0c\u5230\u76d1\u7763\u5fae\u8c03\uff08 SFT \uff09\uff0c\u518d\u5230<mark data-type=\"tech_methods\" data-id=\"ee1a8f69-3170-4ddf-b2b6-47d91c844425\">\u5f3a\u5316\u5b66\u4e60<\/mark>\uff08 RLHF \uff09\u548c\u8bc4\u4f30 (Evaluation) \u7b49\u573a\u666f\u3002<\/section>\n<section><\/section>\n<section><strong>\u56e2\u961f\u4ecb\u7ecd<\/strong><\/section>\n<section><\/section>\n<section><mark data-type=\"institutions\" data-id=\"7092494f-e4a9-4175-8efe-b5ddb66a9878\">\u5b57\u8282\u8df3\u52a8<\/mark>\u8c46\u5305\u5927\u6a21\u578b\u56e2\u961f\u6210\u7acb\u4e8e 2023 \u5e74\uff0c\u81f4\u529b\u4e8e\u5f00\u53d1\u4e1a\u754c\u6700\u5148\u8fdb\u7684 AI 
\u5927\u6a21\u578b\u6280\u672f\uff0c\u6210\u4e3a\u4e16\u754c\u4e00\u6d41\u7684\u7814\u7a76\u56e2\u961f\uff0c\u4e3a\u79d1\u6280\u548c\u793e\u4f1a\u53d1\u5c55\u4f5c\u51fa\u8d21\u732e\u3002<\/section>\n<section><\/section>\n<section>\u76ee\u524d\uff0c\u56e2\u961f\u6b63\u5728\u6301\u7eed\u5438\u5f15\u4f18\u79c0\u4eba\u624d\u52a0\u5165\uff0c\u786c\u6838\u3001\u5f00\u653e\u4e14\u5145\u6ee1\u521b\u65b0\u7cbe\u795e\u662f\u56e2\u961f\u6c1b\u56f4\u5173\u952e\u8bcd\uff0c\u56e2\u961f\u81f4\u529b\u4e8e\u521b\u9020\u4e00\u4e2a\u79ef\u6781\u5411\u4e0a\u7684\u5de5\u4f5c\u73af\u5883\uff0c\u9f13\u52b1\u56e2\u961f\u6210\u5458\u4e0d\u65ad\u5b66\u4e60\u548c\u6210\u957f\uff0c\u4e0d\u754f\u6311\u6218\uff0c\u8ffd\u6c42\u5353\u8d8a\u3002<\/section>\n<section><\/section>\n<section>\u5e0c\u671b\u4e0e\u5177\u5907\u521b\u65b0\u7cbe\u795e\u3001\u8d23\u4efb\u5fc3\u7684\u6280\u672f\u4eba\u624d\u4e00\u8d77\uff0c\u63a8\u8fdb\u5927\u6a21\u578b\u8bad\u7ec3\u63d0\u6548\u5de5\u4f5c\u53d6\u5f97\u66f4\u591a\u8fdb\u5c55\u548c\u6210\u679c\u3002<\/section>\n<section><\/section>\n<section><em><sup>\u53c2\u8003\u6587\u732e<\/sup><\/em><\/section>\n<section><sup><em>[1] Mohan, Jayashree, Amar Phanishayee, and Vijay Chidambaram. &#8220;{CheckFreq}: Frequent,{Fine-Grained}{DNN} Checkpointing.&#8221; 19th USENIX Conference on File and Storage Technologies (FAST 21). 2021.<\/em><\/sup><\/section>\n<section><sup><em>[2] Eisenman, Assaf, et al. &#8220;{Check-N-Run}: A Checkpointing system for training deep learning recommendation models.&#8221; 19th USENIX Symposium on Networked Systems Design and Implementation (NSDI 22). 2022.<\/em><\/sup><\/section>\n<section><sup><em>[3] Wang, Zhuang, et al. &#8220;Gemini: Fast failure recovery in distributed training with in-memory Checkpoints.&#8221; Proceedings of the 29th Symposium on Operating Systems Principles. 2023.<\/em><\/sup><\/section>\n<section><sup><em>[4] Gupta, Tanmaey, et al. 
&#8220;Just-In-Time Checkpointing: Low Cost Error Recovery from Deep Learning Training Failures.&#8221; Proceedings of the Nineteenth European Conference on Computer Systems. 2024.<\/em><\/sup><\/section>\n<section><sup><em>[5] Shoeybi, Mohammad, et al. &#8220;Megatron-lm: Training multi-billion parameter language models using model parallelism.&#8221; arXiv preprint arXiv:1909.08053 (2019).<\/em><\/sup><\/section>\n<section><sup><em>[6] Zhao, Yanli, et al. &#8220;Pytorch fsdp: experiences on scaling fully sharded data parallel.&#8221; arXiv preprint arXiv:2304.11277 (2023).<\/em><\/sup><\/section>\n<section><sup><em>[7] Rasley, Jeff, et al. &#8220;Deepspeed: System optimizations enable training deep learning models with over 100 billion parameters.&#8221; Proceedings of the 26th ACM SIGKDD International Conference on Knowledge Discovery &amp; Data Mining. 2020.<\/em><\/sup><\/section>\n<section><sup><em>[8] Jiang, Ziheng, et al. &#8220;{MegaScale}: Scaling large language model training to more than 10,000 {GPUs}.&#8221; 21st USENIX Symposium on Networked Systems Design and Implementation (NSDI 24). 2024.<\/em><\/sup><\/section>\n<section><sup><em>[9] veScale: A PyTorch Native LLM Training Framework https:\/\/github.com\/volcengine\/veScale<\/em><\/sup><\/section>\n<section><em><sup>[10] Brown, Tom, et al. 
&#8220;Language models are few-shot learners.&#8221; Advances in neural information processing systems 33 (2020): 1877-1901.<\/sup><\/em><\/section>\n<p>\u6587\u7ae0\u6765\u6e90\u4e8e\u4e92\u8054\u7f51:<a href=\"https:\/\/www.jiqizhixin.com\/articles\/2024-08-08-7\" target=\"_blank\">Llama3\u8bad\u7ec3\u6bcf3\u5c0f\u65f6\u5d29\u4e00\u6b21\uff1f\u8c46\u5305\u5927\u6a21\u578b\u3001\u6e2f\u5927\u56e2\u961f\u4e3a\u8106\u76ae\u4e07\u5361\u8bad\u7ec3\u63d0\u6548<\/a><\/p>\n","protected":false},"excerpt":{"rendered":"<p>\u6587\u7ae0\u6765\u6e90\u4e8e\u4e92\u8054\u7f51:Llama3\u8bad\u7ec3\u6bcf3\u5c0f [&hellip;]<\/p>\n","protected":false},"author":3,"featured_media":0,"comment_status":"open","ping_status":"","sticky":false,"template":"","format":"standard","meta":{"site-sidebar-layout":"default","site-content-layout":"","ast-site-content-layout":"","site-content-style":"default","site-sidebar-style":"default","ast-global-header-display":"","ast-banner-title-visibility":"","ast-main-header-display":"","ast-hfb-above-header-display":"","ast-hfb-below-header-display":"","ast-hfb-mobile-header-display":"","site-post-title":"","ast-breadcrumbs-content":"","ast-featured-img":"","footer-sml-layout":"","theme-transparent-header-meta":"","adv-header-id-meta":"","stick-header-meta":"","header-above-stick-meta":"","header-main-stick-meta":"","header-below-stick-meta":"","astra-migrate-meta-layouts":"default","ast-page-background-enabled":"default","ast-page-background-meta":{"desktop":{"background-color":"var(--ast-global-color-4)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"tablet":{"background-color":"","background-image":"","background-repeat":"repeat","background-position":"center 
center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"mobile":{"background-color":"","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""}},"ast-content-background-meta":{"desktop":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"tablet":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"mobile":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""}},"footnotes":""},"categories":[27],"tags":[71,68],"class_list":["post-34993","post","type-post","status-publish","format-standard","hentry","category-news","tag-rag","tag-68"],"yoast_head":"<!-- This site is optimized with the Yoast SEO plugin v26.4 - https:\/\/yoast.com\/wordpress\/plugins\/seo\/ -->\n<title>Llama3\u8bad\u7ec3\u6bcf3\u5c0f\u65f6\u5d29\u4e00\u6b21\uff1f\u8c46\u5305\u5927\u6a21\u578b\u3001\u6e2f\u5927\u56e2\u961f\u4e3a\u8106\u76ae\u4e07\u5361\u8bad\u7ec3\u63d0\u6548 - 
\u4e00\u8d77AI\u6280\u672f<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/17aitech.com\/?p=34993\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"WebPage\",\"@id\":\"https:\/\/17aitech.com\/?p=34993\",\"url\":\"https:\/\/17aitech.com\/?p=34993\",\"name\":\"Llama3\u8bad\u7ec3\u6bcf3\u5c0f\u65f6\u5d29\u4e00\u6b21\uff1f\u8c46\u5305\u5927\u6a21\u578b\u3001\u6e2f\u5927\u56e2\u961f\u4e3a\u8106\u76ae\u4e07\u5361\u8bad\u7ec3\u63d0\u6548 - \u4e00\u8d77AI\u6280\u672f\",\"isPartOf\":{\"@id\":\"https:\/\/17aitech.com\/#website\"},\"primaryImageOfPage\":{\"@id\":\"https:\/\/17aitech.com\/?p=34993#primaryimage\"},\"image\":{\"@id\":\"https:\/\/17aitech.com\/?p=34993#primaryimage\"},\"thumbnailUrl\":\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-d9f08060ac50dd1443252f63d2b30c0c.png\",\"datePublished\":\"2024-12-16T06:58:56+00:00\",\"author\":{\"@id\":\"https:\/\/17aitech.com\/#\/schema\/person\/60225458499e817ae0af73e67e440b9d\"},\"breadcrumb\":{\"@id\":\"https:\/\/17aitech.com\/?p=34993#breadcrumb\"},\"inLanguage\":\"zh-Hans\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\/\/17aitech.com\/?p=34993\"]}]},{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"https:\/\/17aitech.com\/?p=34993#primaryimage\",\"url\":\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-d9f08060ac50dd1443252f63d2b30c0c.png\",\"contentUrl\":\"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-d9f08060ac50dd1443252f63d2b30c0c.png\"},{\"@type\":\"BreadcrumbList\",\"@id\":\"https:\/\/17aitech.com\/?p=34993#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"\u9996\u9875\",\"item\":\"https:\/\/17aitech.com\/\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"Llama3\u8bad\u7ec3\u6bcf3\u5c0f\u65f6\u5d29\u4e00\u
6b21\uff1f\u8c46\u5305\u5927\u6a21\u578b\u3001\u6e2f\u5927\u56e2\u961f\u4e3a\u8106\u76ae\u4e07\u5361\u8bad\u7ec3\u63d0\u6548\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/17aitech.com\/#website\",\"url\":\"https:\/\/17aitech.com\/\",\"name\":\"\u4e00\u8d77AI\u6280\u672f\",\"description\":\"\u8ba9AI\u77e5\u8bc6\u89e6\u624b\u53ef\u53ca\",\"alternateName\":\"\u4e00\u8d77AI\u6280\u672f\",\"potentialAction\":[{\"@type\":\"SearchAction\",\"target\":{\"@type\":\"EntryPoint\",\"urlTemplate\":\"https:\/\/17aitech.com\/?s={search_term_string}\"},\"query-input\":{\"@type\":\"PropertyValueSpecification\",\"valueRequired\":true,\"valueName\":\"search_term_string\"}}],\"inLanguage\":\"zh-Hans\"},{\"@type\":\"Person\",\"@id\":\"https:\/\/17aitech.com\/#\/schema\/person\/60225458499e817ae0af73e67e440b9d\",\"name\":\"AI\u5c0f\u52a9\u624b\",\"image\":{\"@type\":\"ImageObject\",\"inLanguage\":\"zh-Hans\",\"@id\":\"https:\/\/17aitech.com\/#\/schema\/person\/image\/\",\"url\":\"\/\/17aitech.com\/wp-content\/uploads\/2024\/04\/robot_3.png\",\"contentUrl\":\"\/\/17aitech.com\/wp-content\/uploads\/2024\/04\/robot_3.png\",\"caption\":\"AI\u5c0f\u52a9\u624b\"},\"description\":\"\u8fd9\u4e2a\u4eba\u5f88\u61d2\uff0c\u4ec0\u4e48\u90fd\u6ca1\u6709\u7559\u4e0b\uff5e\",\"url\":\"https:\/\/17aitech.com\/?page_id=33738&user=3\"}]}<\/script>\n<!-- \/ Yoast SEO plugin. 
-->","yoast_head_json":{"title":"Llama3\u8bad\u7ec3\u6bcf3\u5c0f\u65f6\u5d29\u4e00\u6b21\uff1f\u8c46\u5305\u5927\u6a21\u578b\u3001\u6e2f\u5927\u56e2\u961f\u4e3a\u8106\u76ae\u4e07\u5361\u8bad\u7ec3\u63d0\u6548 - \u4e00\u8d77AI\u6280\u672f","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/17aitech.com\/?p=34993","schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"WebPage","@id":"https:\/\/17aitech.com\/?p=34993","url":"https:\/\/17aitech.com\/?p=34993","name":"Llama3\u8bad\u7ec3\u6bcf3\u5c0f\u65f6\u5d29\u4e00\u6b21\uff1f\u8c46\u5305\u5927\u6a21\u578b\u3001\u6e2f\u5927\u56e2\u961f\u4e3a\u8106\u76ae\u4e07\u5361\u8bad\u7ec3\u63d0\u6548 - \u4e00\u8d77AI\u6280\u672f","isPartOf":{"@id":"https:\/\/17aitech.com\/#website"},"primaryImageOfPage":{"@id":"https:\/\/17aitech.com\/?p=34993#primaryimage"},"image":{"@id":"https:\/\/17aitech.com\/?p=34993#primaryimage"},"thumbnailUrl":"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-d9f08060ac50dd1443252f63d2b30c0c.png","datePublished":"2024-12-16T06:58:56+00:00","author":{"@id":"https:\/\/17aitech.com\/#\/schema\/person\/60225458499e817ae0af73e67e440b9d"},"breadcrumb":{"@id":"https:\/\/17aitech.com\/?p=34993#breadcrumb"},"inLanguage":"zh-Hans","potentialAction":[{"@type":"ReadAction","target":["https:\/\/17aitech.com\/?p=34993"]}]},{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"https:\/\/17aitech.com\/?p=34993#primaryimage","url":"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-d9f08060ac50dd1443252f63d2b30c0c.png","contentUrl":"https:\/\/17aitech.com\/wp-content\/uploads\/2024\/08\/frc-d9f08060ac50dd1443252f63d2b30c0c.png"},{"@type":"BreadcrumbList","@id":"https:\/\/17aitech.com\/?p=34993#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"\u9996\u9875","item":"https:\/\/17aitech.com\/"},{"@type":"ListItem","position":2,"name":"Llama3\u8
bad\u7ec3\u6bcf3\u5c0f\u65f6\u5d29\u4e00\u6b21\uff1f\u8c46\u5305\u5927\u6a21\u578b\u3001\u6e2f\u5927\u56e2\u961f\u4e3a\u8106\u76ae\u4e07\u5361\u8bad\u7ec3\u63d0\u6548"}]},{"@type":"WebSite","@id":"https:\/\/17aitech.com\/#website","url":"https:\/\/17aitech.com\/","name":"\u4e00\u8d77AI\u6280\u672f","description":"\u8ba9AI\u77e5\u8bc6\u89e6\u624b\u53ef\u53ca","alternateName":"\u4e00\u8d77AI\u6280\u672f","potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/17aitech.com\/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"zh-Hans"},{"@type":"Person","@id":"https:\/\/17aitech.com\/#\/schema\/person\/60225458499e817ae0af73e67e440b9d","name":"AI\u5c0f\u52a9\u624b","image":{"@type":"ImageObject","inLanguage":"zh-Hans","@id":"https:\/\/17aitech.com\/#\/schema\/person\/image\/","url":"\/\/17aitech.com\/wp-content\/uploads\/2024\/04\/robot_3.png","contentUrl":"\/\/17aitech.com\/wp-content\/uploads\/2024\/04\/robot_3.png","caption":"AI\u5c0f\u52a9\u624b"},"description":"\u8fd9\u4e2a\u4eba\u5f88\u61d2\uff0c\u4ec0\u4e48\u90fd\u6ca1\u6709\u7559\u4e0b\uff5e","url":"https:\/\/17aitech.com\/?page_id=33738&user=3"}]}},"_links":{"self":[{"href":"https:\/\/17aitech.com\/index.php?rest_route=\/wp\/v2\/posts\/34993","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/17aitech.com\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/17aitech.com\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/17aitech.com\/index.php?rest_route=\/wp\/v2\/users\/3"}],"replies":[{"embeddable":true,"href":"https:\/\/17aitech.com\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=34993"}],"version-history":[{"count":0,"href":"https:\/\/17aitech.com\/index.php?rest_route=\/wp\/v2\/posts\/34993\/revisions"}],"wp:attachment":[{"href":"https:\/\/17aitech.com\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&p
arent=34993"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/17aitech.com\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=34993"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/17aitech.com\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=34993"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}