{"id":19891,"date":"2025-08-07T11:53:24","date_gmt":"2025-08-07T03:53:24","guid":{"rendered":"https:\/\/aicats.wiki\/sites\/19891.html"},"modified":"2025-08-07T11:53:24","modified_gmt":"2025-08-07T03:53:24","slug":"deepspeed","status":"publish","type":"sites","link":"https:\/\/aicats.wiki\/tw\/sites\/19891-html","title":{"rendered":"DeepSpeed"},"content":{"rendered":"<p>2024\u5e746\u6708\uff0c\u4eba\u5de5\u667a\u80fd\u5927\u8bed\u8a00\u6a21\u578b\u6b65\u5165\u89c4\u6a21\u5316\u65f6\u4ee3\u3002DeepSpeed\uff0c\u7531\u5fae\u8f6f\u7814\u53d1\u5e76\u5f00\u6e90\uff0c\u4ee5\u5176\u5353\u8d8a\u7684\u4f18\u5316\u6280\u672f\u6210\u4e3a\u5168\u7403<a class=\"external\" href=\"https:\/\/aicats.wiki\/tw\/tag\/ai\" title=\"\u67e5\u770b\u8207 AI \u76f8\u95dc\u7684\u6587\u7ae0\" target=\"_blank\">AI<\/a>\u5f00\u53d1\u8005\u7684\u91cd\u8981\u5de5\u5177\u3002<strong>DeepSpeed<\/strong>\u5177\u5099\u9ad8\u6548\u7387\u7684\u591aGPU\u3001\u591a\u6a5f\u5206\u6563\u5f0f\u8a13\u7df4\u80fd\u529b\uff0c\u4f7f\u5f97\u5927\u898f\u6a21<a href=\"https:\/\/aicats.wiki\/tw\/sites\/20475-html\/\" title=\"LOBE\">AI\u6a21\u578b\u8a13\u7df4<\/a>\u66f4\u4e3a\u9ad8\u6548\u3001\u6210\u672c\u66f4\u4f4e\u3002\u5176\u6838\u5fc3\u6280\u672f\u5305\u62ecDeepSpeed-Tr<a class=\"external\" href=\"https:\/\/aicats.wiki\/tw\/sitetag\/ai\" title=\"\u67e5\u770b\u8207 ai \u76f8\u95dc\u7684\u6587\u7ae0\" 
target=\"_blank\">ai<\/a>ning\u3001DeepSpeed-Inference\u3001DeepSpeed-Compression\u4ee5\u53caDeepSpeed4Science\u56db\u5927\u652f\u67f1\u3002\u7528\u6237\u53ef\u4ee5\u5728\u672c\u5730\u6216Azure\u4e91\u7aef\u90e8\u7f72\uff0c\u4f53\u9a8c\u514d\u8d39\u4e14\u9ad8\u6027\u80fd\u7684AI\u6a21\u578b\u8bad\u7ec3\u3002<\/p>\n\n\n\n<p>2024\u5e746\u6708\uff0c\u4eba\u5de5\u667a\u6167\u5927\u8a9e\u8a00\u6a21\u578b\u72c2\u98c6\u7a81\u9032\uff0c\u5f9eGPT-4\u3001BLOOM\u5230\u6700\u65b0\u7684\u4f01\u696d\u7d1a\u61c9\u7528\uff0c<strong>\u5927\u898f\u6a21AI\u8a13\u7df4\u6a21\u578b<\/strong>\u5df2\u6210\u70ba\u696d\u754c\u529b\u722d\u9ad8\u5730\u3002\u96a8\u8457\u6a21\u578b\u53c3\u6578\u91cf\u6b65\u5165\u6578\u5341\u5104\uff0c\u751a\u81f3\u6578\u5343\u5104\u7d1a\uff0c\u8a13\u7df4\u548c\u63a8\u7406\u7684\u6210\u672c\u8207\u96e3\u5ea6\u4e5f\u5448\u6307\u6578\u7d1a\u589e\u9577\u3002\u7531\u5fae\u8edf\u7814\u767c\u4e26\u958b\u6e90\u7684<strong>DeepSpeed<\/strong>\uff0c\u6b63\u4ee5\u5176\u6975\u81f4\u7684\u512a\u5316\u6280\u8853\uff0c\u5fb9\u5e95\u6539\u8b8a\u9019\u4e00\u5c40\u9762\uff0c\u6210\u70ba\u5168\u7403AI\u958b\u767c\u8005\u4e0d\u53ef\u6216\u7f3a\u7684\u300c\u57fa\u790e\u8a2d\u65bd\u300d\u3002<\/p>\n\n\n\n<blockquote class=\"wp-block-quote is-layout-flow wp-block-quote-is-layout-flow\">\n<p>\u9020\u8a2aDeepSpeed\u5b98\u65b9\u7db2\u7ad9\uff1a<a href=\"https:\/\/www.deepspeed.ai\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >https:\/\/www.deepspeed.ai\/<\/a><\/p>\n<\/blockquote>\n\n\n\n<figure class=\"wp-block-image size-full\"><img fetchpriority=\"high\" decoding=\"async\" width=\"1595\" height=\"918\" src=\"https:\/\/aicats.wiki\/wp-content\/uploads\/2025\/08\/image-211.png\" alt=\"DeepSpeed\u5b98\u7db2\u622a\u5716\" class=\"wp-image-23623\"\/><figcaption class=\"wp-element-caption\">\u5716\uff0f<a href=\"https:\/\/www.deepspeed.ai\/getting-started\/\" title=\"\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" 
>DeepSpeed\u5b98\u7db2\u622a\u5716<\/a><\/figcaption><\/figure>\n\n\n\n<h2 class=\"wp-block-heading\">\u4ec0\u9ebc\u662fDeepSpeed\uff1f<\/h2>\n\n\n\n<p><strong>DeepSpeed<\/strong> \u662f\u4e00\u6b3e\u6df1\u5ea6\u5b78\u7fd2\u512a\u5316\u8edf\u9ad4\u5957\u4ef6\uff08Deep Learning Optimization Software Suite\uff09\uff0c\u5c08\u70ba\u8a13\u7df4\u548c\u63a8\u7406\u8d85\u5927\u898f\u6a21\u6a21\u578b\u6253\u9020\uff0c\u666e\u904d\u61c9\u7528\u65bc\u5982MT-NLG\u3001BLOOM\u3001Jurassic-1\u7b49\u9802\u7d1a\u5927\u578b\u6a21\u578b\u7684\u8a13\u7df4\u5834\u666f\u3002 DeepSpeed\u8ffd\u6c42\u6975\u81f4\u9ad8\u6548\uff0c\u4e3b\u6253\u5728\u591aGPU\u3001\u591a\u6a5f\u5206\u6563\u5f0f\u74b0\u5883\u4e2d\uff0c\u5c07\u8a13\u7df4\u901f\u5ea6\u6700\u5927\u5316\u3001\u8cc7\u6e90\u5229\u7528\u6700\u512a\u3001\u6210\u672c\u5927\u5e45\u964d\u4f4e\u3002<br>\n\u5b83\u4e0d\u50c5\u9069\u7528\u65bc\u5927\u6a21\u578b\uff0c\u4e5f\u80fd\u8b93\u4e2d\u5c0f\u578b\u5718\u968a\u5728\u66f4\u5e73\u50f9\u786c\u9ad4\u4e0a\u5b8c\u6210\u4ee5\u5f80\u9700\u300c\u5de8\u7121\u9738\u300d\u4f3a\u670d\u5668\u53e2\u96c6\u7684\u4efb\u52d9\u3002<\/p>\n\n\n\n<h2 class=\"wp-block-heading\">DeepSpeed\u7684\u4e3b\u8981\u529f\u80fd<\/h2>\n\n\n\n<h3 class=\"wp-block-heading\">\u6280\u8853\u5275\u65b0\u56db\u5927\u652f\u67f1<\/h3>\n\n\n\n<p>DeepSpeed\u7684\u6838\u5fc3\u5275\u65b0\u5206\u70ba\u56db\u5927\u652f\u67f1\uff0c\u6bcf\u4e00\u9805\u90fd\u91dd\u5c0dAI\u8a13\u7df4\u8207\u63a8\u7406\u4e2d\u7684\u75db\u9ede\uff1a<\/p>\n\n\n\n<figure class=\"wp-block-table\"><table 
class=\"has-fixed-layout\"><thead><tr><th>\u652f\u67f1<\/th><th>\u4e3b\u8981\u529f\u80fd<\/th><\/tr><\/thead><tbody><tr><td><strong>DeepSpeed-Training<\/strong><\/td><td>\u8a2d\u8a08\u7528\u65bc\u7a81\u7834\u6027\u7684\u5927\u898f\u6a21\u5e73\u884c\u8a13\u7df4\uff08\u5982ZeRO\u30013D-Parallelism\u3001Mixture-of-Experts\u3001ZeRO-Infinity\u7b49\uff09\uff0c\u5927\u5e45\u63d0\u5347\u8a13\u7df4\u6548\u7387\u8207\u898f\u6a21\u3002<\/td><\/tr><tr><td><strong>DeepSpeed-Inference<\/strong><\/td><td>\u900f\u904e\u5f35\u91cf\u3001\u7ba1\u7dda\u3001\u5c08\u5bb6\u6a21\u578b\u3001ZeRO\u7b49\u591a\u7a2e\u5e73\u884c\u6280\u8853\u548c\u6838\u5fc3\u512a\u5316\uff0c\u5be6\u73fe\u8d85\u5927\u6a21\u578b\u7684\u9ad8\u6548\u4f4e\u5ef6\u9072\u63a8\u7406\u3002<\/td><\/tr><tr><td><strong>DeepSpeed-Compression<\/strong><\/td><td>\u63d0\u4f9b\u6613\u7528\u3001\u9ad8\u9748\u6d3b\u5ea6\u7684\u6a21\u578b\u58d3\u7e2e\u65b9\u6848\uff08\u5982ZeroQuant\u3001XTC\u7b49\uff09\uff0c\u5728\u4e0d\u5f71\u97ff\u8868\u73fe\u4e0b\u5927\u5e45\u6e1b\u5c11\u6a21\u578b\u9ad4\u7a4d\u3001\u52a0\u901f\u63a8\u7406\u901f\u5ea6\u3001\u7bc0\u7701\u6210\u672c\u3002<\/td><\/tr><tr><td><strong>DeepSpeed4Science<\/strong><\/td><td>\u7d50\u5408\u7cfb\u7d71\u512a\u5316\u8207\u79d1\u5b78\u7b97\u529b\uff0c\u5354\u52a9\u751f\u547d\u79d1\u5b78\u3001\u7269\u7406\u7b49\u524d\u6cbf\u9818\u57df\uff0c\u5927\u5e45\u63d0\u6607\u79d1\u7814AI\u6a21\u578b\u7684\u8a13\u7df4\u6548\u7387\u3002<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<p>\u8a73\u7d30\u6280\u8853\u4ecb\u7d39\u53ef\u67e5\u95b1 <a href=\"https:\/\/www.deepspeed.ai\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >DeepSpeed\u6280\u8853\u652f\u67f1\u9801\u9762<\/a>\u3002<\/p>\n\n\n\n<figure class=\"wp-block-image size-full\"><img decoding=\"async\" width=\"1595\" height=\"918\" src=\"https:\/\/aicats.wiki\/wp-content\/uploads\/2025\/08\/image-212.png\" alt=\" DeepSpeed\u6280\u8853\u652f\u67f1\u9801\u9762\" class=\"wp-image-23628\"\/><figcaption 
class=\"wp-element-caption\">\u5716\uff0f <a href=\"https:\/\/www.deepspeed.ai\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >DeepSpeed\u6280\u8853\u652f\u67f1\u9801\u9762<\/a><\/figcaption><\/figure>\n\n\n\n<h3 class=\"wp-block-heading\">DeepSpeed-Training<\/h3>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>\u7a81\u7834\u6027\u5206\u6563\u5f0f\u8a13\u7df4\u512a\u5316<\/strong>\uff0c\u5982ZeRO\u7cfb\u5217\u512a\u5316\u5668\uff0c\u4f7f\u591a\u7bc0\u9ede\u6578\u5343GPU\u4e0a\u7dda\u6027\u64f4\u5c55\uff0c\u8f15\u9b06\u652f\u6490\u5343\u5104\u53c3\u6578\u6a21\u578b\u8a13\u7df4\u3002<\/li>\n\n\n\n<li><strong>3D-Parallelism<\/strong>\uff0c\u5be6\u73fe\u5f35\u91cf\u3001\u7ba1\u7dda\u3001\u8cc7\u6599\u4e09\u7dad\u4e26\u884c\uff0c\u6975\u81f4\u6316\u6398\u8a08\u7b97\u8207\u8a18\u61b6\u9ad4\u983b\u5bec\u3002<\/li>\n\n\n\n<li><strong>MoE\uff08\u5c08\u5bb6\u6a21\u578b\uff09\u8a13\u7df4\u512a\u5316<\/strong>\uff0c\u81ea\u52d5\u7ba1\u7406\u7a00\u758f\u555f\u52d5\u5927\u6a21\u578b\uff0c\u8a13\u7df4\u7a00\u758f\u53c3\u6578\u66f4\u6709\u6548\u7387\u3002<\/li>\n<\/ul>\n\n\n\n<h3 class=\"wp-block-heading\">DeepSpeed-Inference<\/h3>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>\u8d85\u5927\u6a21\u578b\u4f4e\u5ef6\u9072\u63a8\u7406<\/strong>\uff0c\u7d50\u5408\u81ea\u7814\u9ad8\u6027\u80fd\u63a8\u7406\u5167\u6838\u548c\u901a\u8a0a\u512a\u5316\uff0c\u5343\u5104\u7d1a\u6a21\u578b\u4e5f\u80fd\u5feb\u901f\u3001\u591a\u4e26\u767c\u670d\u52d9\u4e0a\u7dda\u3002<\/li>\n\n\n\n<li><strong>\u7570\u8cea\u8a18\u61b6\u9ad4\u8abf\u5ea6<\/strong>\uff0c\u652f\u63f4CPU+GPU\/NVMe\u6df7\u5408\u5b58\u5132\uff0c\u5927\u5e45\u964d\u4f4e\u986f\u5b58\u9700\u6c42\u3002<\/li>\n<\/ul>\n\n\n\n<h3 class=\"wp-block-heading\">DeepSpeed-Compression<\/h3>\n\n\n\n<ul 
class=\"wp-block-list\">\n<li><strong>\u58d3\u7e2e\u8207\u91cf\u5316\u4e00\u9ad4\u5316<\/strong>\uff0c\u5167\u5efaZeroQuant\u3001XTC\u7b49\u5c16\u7aef\u6280\u8853\uff0c\u652f\u63f4\u5168\u81ea\u52d5\u58d3\u7e2e\uff0c\u65b9\u4fbf\u9810\u6e2c\u90e8\u7f72\u3002<\/li>\n\n\n\n<li><strong>\u9748\u6d3b\u4e26\u53ef\u7d44\u5408\u7684\u58d3\u7e2eAPI<\/strong>\uff0c\u517c\u5bb9\u79d1\u7814\u8207\u5de5\u696d\u9700\u6c42\u3002<\/li>\n<\/ul>\n\n\n\n<p>\u66f4\u591a\u8a73\u898b <a href=\"https:\/\/www.deepspeed.ai\/technology\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >DeepSpeed\u529f\u80fd\u5217\u8868<\/a>\u3002<\/p>\n\n\n\n<h2 class=\"wp-block-heading\">DeepSpeed\u7684\u50f9\u683c&amp; \u65b9\u6848<\/h2>\n\n\n\n<p><strong>DeepSpeed\u5b8c\u5168\u958b\u6e90\u514d\u8cbb<\/strong>\uff0c\u7528\u6236\u53ef\u4ee5\u5728<a href=\"https:\/\/github.com\/microsoft\/DeepSpeed\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >GitHub<\/a>\u5feb\u901f\u53d6\u5f97\u539f\u59cb\u78bc\uff0c\u4f01\u696d\u5546\u7528\u3001\u79d1\u7814\u5747\u53ef\u7121\u9580\u6abb\u4f7f\u7528\u3002\u5b98\u65b9\u9084\u63d0\u4f9b\uff1a<\/p>\n\n\n\n<figure class=\"wp-block-image size-full\"><img decoding=\"async\" width=\"1595\" height=\"918\" src=\"https:\/\/aicats.wiki\/wp-content\/uploads\/2025\/08\/image-213.png\" alt=\"GitHub\u958b\u6e90\" class=\"wp-image-23629\"\/><figcaption class=\"wp-element-caption\">\u5716\uff0f<a href=\"https:\/\/github.com\/microsoft\/DeepSpeed\" title=\"\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >GitHub\u958b\u6e90<\/a><\/figcaption><\/figure>\n\n\n\n<ul class=\"wp-block-list\">\n<li>\u6df1\u5ea6Hugging Face Transformers\u3001PyTorch\u3001PyTorch Lightning\u96c6\u6210\uff0c\u964d\u4f4e\u6a21\u578b\u9077\u79fb\u8207\u4e8c\u6b21\u958b\u767c\u9580\u6abb\u3002<\/li>\n\n\n\n<li>\u5fae\u8edfAzure 
\u4e0a\u5b8c\u6574\u652f\u6301\uff0c\u53ef\u76f4\u63a5\u900f\u904eAzureML\u4e00\u9375\u958b\u555f\u5206\u6563\u5f0f\u8a13\u7df4\u3002\u8a73\u898b <a href=\"https:\/\/github.com\/Azure\/azureml-examples\/tree\/main\/python-sdk\/workflows\/train\/deepspeed\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >AzureML\u5b98\u65b9\u6307\u5f15<\/a>\u3002<\/li>\n<\/ul>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><thead><tr><th>\u65b9\u6848<\/th><th>\u50f9\u683c<\/th><th>\u9069\u7528\u5834\u666f<\/th><\/tr><\/thead><tbody><tr><td><strong>\u958b\u6e90\u672c\u5730\u90e8\u7f72<\/strong><\/td><td>\u514d\u8cbb<\/td><td>\u5167\u90e8\u6216\u7814\u7a76\u8cc7\u6599\u3001\u53ef\u81ea\u8a02\u74b0\u5883<\/td><\/tr><tr><td><strong>Azure\u96f2\u7aefAI\u8a13\u7df4<\/strong><\/td><td>\u6309\u96f2\u7aef\u8cc7\u6e90\u8a08\u8cbb<\/td><td>\u5f48\u6027\u64f4\u5c55\u3001\u9ad8\u6548\u80fd\u53e2\u96c6\u3001\u5927\u898f\u6a21\u751f\u7522\u74b0\u5883<\/td><\/tr><tr><td><strong>\u793e\u5340\u652f\u6301\u8207\u4f01\u696d\u5408\u4f5c<\/strong><\/td><td>\u90e8\u5206\u5546\u696d\u670d\u52d9\u8cbb<\/td><td>\u5ba2\u88fd\u5316\u6280\u8853\u652f\u63f4\u3001\u884c\u696d\u7d1a\u6301\u7e8c\u96c6\u6210<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<p>DeepSpeed\u4e0d\u6536\u53d6\u7368\u7acb\u6388\u6b0a\u6216\u4f7f\u7528\u8cbb\uff0c\u793e\u5340\u8207\u4f01\u696d\u670d\u52d9\u8acb\u53c3\u898b<a href=\"https:\/\/www.deepspeed.ai\/support\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >DeepSpeed\u793e\u5340<\/a>\u3002<\/p>\n\n\n\n<h2 class=\"wp-block-heading\">\u5982\u4f55\u4f7f\u7528DeepSpeed<\/h2>\n\n\n\n<h3 class=\"wp-block-heading\">\u5b89\u88dd<\/h3>\n\n\n\n<p>DeepSpeed\u652f\u63f4Linux\u3001Windows\u3001\u4e3b\u6d41GPU\u67b6\u69cb\uff08\u5305\u542bNVIDIA\u3001AMD\u3001Intel\u652f\u63f4\uff09\uff0c\u7c21\u55aepip\u4e00\u884c\u5373\u53ef\uff1a<\/p>\n\n\n\n<!--wp-compress-html--><!--wp-compress-html no compression-->\n<pre 
class=\"wp-block-code\"><code>pip install deepspeed<\/code><\/pre>\n<!--wp-compress-html no compression--><!--wp-compress-html-->\n\n\n\n<p>\u8a73\u7d30\u74b0\u5883&amp;\u52a0\u901f\u5668\u652f\u63f4\u898b <a href=\"https:\/\/www.deepspeed.ai\/tutorials\/accelerator-setup-guide\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >\u8a2d\u5099\u76f8\u5bb9\u6027\u5217\u8868<\/a>\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\">\u5feb\u901f\u6574\u5408\u8a13\u7df4\/\u63a8\u7406\u7a0b\u5f0f\u78bc<\/h3>\n\n\n\n<p>\u4ee5PyTorch\u70ba\u4f8b\uff0c\u53ea\u9700\u4e09\u500b\u6b65\u9a5f\uff1a<\/p>\n\n\n\n<h4 class=\"wp-block-heading\">1. \u914d\u7f6eDeepSpeed\u53c3\u6578\uff08ds_config.json\uff09<\/h4>\n\n\n\n<!--wp-compress-html--><!--wp-compress-html no compression-->\n<pre class=\"wp-block-code\"><code>{ &quot;train_batch_size&quot;: 8, &quot;gradient_accumulation_steps&quot;: 1, &quot;optimizer&quot;: {&quot;type&quot;: &quot;Adam&quot;, &quot;params&quot;: {&quot;lr&quot;: 0.00015}}, &quot;fp16&quot;: {&quot;enabled&quot;: true} }<\/code><\/pre>\n<!--wp-compress-html no compression--><!--wp-compress-html-->\n\n\n\n<figure class=\"wp-block-image size-full\"><img loading=\"lazy\" decoding=\"async\" width=\"1595\" height=\"918\" src=\"https:\/\/aicats.wiki\/wp-content\/uploads\/2025\/08\/image-214.png\" alt=\"\u8a2d\u5099\u76f8\u5bb9\u6027\u5217\u8868\" class=\"wp-image-23632\"\/><figcaption class=\"wp-element-caption\">\u5716\uff0f<a href=\"https:\/\/www.deepspeed.ai\/tutorials\/accelerator-setup-guide\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >\u8a2d\u5099\u76f8\u5bb9\u6027\u5217\u8868<\/a><\/figcaption><\/figure>\n\n\n\n<h4 class=\"wp-block-heading\">2. 
\u521d\u59cb\u5316DeepSpeed\u5f15\u64ce\uff08\u8a13\u7df4\u7bc4\u4f8b\uff09<\/h4>\n\n\n\n<!--wp-compress-html--><!--wp-compress-html no compression-->\n<pre class=\"wp-block-code\"><code>import deepspeed\nmodel, optimizer, _, _ = deepspeed.initialize(args=cmd_args, model=model, model_parameters=params)<\/code><\/pre>\n<!--wp-compress-html no compression--><!--wp-compress-html-->\n\n\n\n<h4 class=\"wp-block-heading\">3. \u555f\u52d5\u5206\u6563\u5f0f\u8a13\u7df4\u6307\u4ee4<\/h4>\n\n\n\n<!--wp-compress-html--><!--wp-compress-html no compression-->\n<pre class=\"wp-block-code\"><code>deepspeed --num_gpus=4 train.py --deepspeed --deepspeed_config ds_config.json<\/code><\/pre>\n<!--wp-compress-html no compression--><!--wp-compress-html-->\n\n\n\n<p>\u8a73\u7d30\u7528\u6cd5\u53ef\u898b<a href=\"https:\/\/www.deepspeed.ai\/getting-started\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >\u5b98\u65b9\u5165\u9580\u6559\u5b78<\/a>\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\">\u96f2\u7aef\u4e00\u9375\u8a66\u7528<\/h3>\n\n\n\n<p>\u5fae\u8edfAzure\u900f\u904e<a href=\"https:\/\/github.com\/Azure\/azureml-examples\/issues\" title=\"\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >AzureML<\/a>\u63d0\u4f9bDeepSpeed\u6a21\u677f\uff0c\u9069\u5408\u96f2\u7aef\u904b\u7b97\u5f48\u6027\u8cc7\u6e90\u7684\u5927\u898f\u6a21AI\u8a13\u7df4\u5834\u666f\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\">Hugging Face\u3001Lightning\u539f\u751f\u96c6\u6210<\/h3>\n\n\n\n<p>\u4e00\u53e5\u6307\u4ee4+config\u5373\u53ef\u8b93Transformers\u3001PyTorch Lightning\u4efb\u52d9\u63a5\u5165DeepSpeed\u52a0\u901f\uff0c\u898b <a href=\"https:\/\/huggingface.co\/docs\/transformers\/deepspeed\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >HF\u6574\u5408\u6559\u7a0b<\/a>\u3002<\/p>\n\n\n\n<figure class=\"wp-block-image size-full\"><img loading=\"lazy\" decoding=\"async\" width=\"1595\" height=\"918\" 
src=\"https:\/\/aicats.wiki\/wp-content\/uploads\/2025\/08\/image-215-1.jpg\" alt=\"HF\u6574\u5408\u6559\u7a0b\" class=\"wp-image-23636\"\/><figcaption class=\"wp-element-caption\">\u5716\uff0f<a href=\"https:\/\/huggingface.co\/docs\/transformers\/deepspeed\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >HF\u6574\u5408\u6559\u7a0b<\/a><\/figcaption><\/figure>\n\n\n\n<h2 class=\"wp-block-heading\">DeepSpeed\u7684\u9069\u7528\u4eba\u7fa4<\/h2>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><thead><tr><th>\u89d2\u8272<\/th><th>\u4f7f\u7528\u50f9\u503c<\/th><\/tr><\/thead><tbody><tr><td><strong>AI\u7814\u767c\u5718\u968a<\/strong><\/td><td>\u8a13\u7df4\u5343\u5104\u53c3\u6578\u5927\u6a21\u578b\uff0c\u5927\u5e45\u964d\u4f4e\u6210\u672c\u8207\u958b\u767c\u96e3\u5ea6<\/td><\/tr><tr><td><strong>AI\u65b0\u5275\u516c\u53f8<\/strong><\/td><td>\u5229\u7528\u958b\u6e90\u96c6\u7fa4\uff0c\u4f4e\u9580\u6abb\u5be6\u73fe\u696d\u754c\u9818\u5148\u7684\u6a21\u578b\u8a13\u7df4<\/td><\/tr><tr><td><strong>\u5b78\u8853\u79d1\u5b78\u7814\u7a76\u5718\u968a<\/strong><\/td><td>\u64f4\u5c55\u8ad6\u6587\u7d1a\u5be6\u9a57\u898f\u6a21\uff0c\u63a8\u52d5\u5927\u6a21\u578b\u7406\u8ad6\u8207\u65b0\u6f14\u7b97\u6cd5\u7a81\u7834<\/td><\/tr><tr><td><strong>\u96f2\u7aef\u670d\u52d9&amp;\u5927\u5ee0<\/strong><\/td><td>\u9762\u5411SaaS\/PaaS 
AI\u670d\u52d9\uff0c\u652f\u6490\u8d85\u9ad8\u4e26\u767c\u8207\u5927\u6a21\u578b\u63a8\u7406\u4f4e\u5ef6\u9072\u90e8\u7f72<\/td><\/tr><tr><td><strong>DL\u6846\u67b6\u958b\u767c\u8005<\/strong><\/td><td>\u6df1\u5ea6\u6574\u5408\u5206\u6563\u5f0f\u6700\u4f73\u5316\u8207\u6a21\u578b\u58d3\u7e2e\u6280\u8853\uff0c\u958b\u653e\u81ea\u8a02\u6700\u4f73\u5316\u8207\u63d2\u4ef6\u6846\u67b6<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<p>\u9069\u5408\u4e00\u5207\u5c0d<strong>AI\u8a13\u7df4\u6a21\u578b<\/strong>\u6709\u9ad8\u6027\u80fd\u3001\u4f4e\u6210\u672c\u3001\u6613\u64f4\u5c55\u9700\u6c42\u7684\u4f01\u696d\u8207\u500b\u4eba\u3002<\/p>\n\n\n\n<h2 class=\"wp-block-heading\">DeepSpeed\u6574\u5408\u8207\u751f\u614b<\/h2>\n\n\n\n<p><strong>DeepSpeed\u64c1\u6709\u9ad8\u5ea6\u958b\u653e\u8207\u8c50\u5bcc\u7684\u751f\u614b\uff1a<\/strong><\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>\u8207\u4e3b\u6d41DL\u6846\u67b6\u7121\u7e2b\u96c6\u6210<\/strong>\uff1a\u5982Hugging Face Transformers\u3001Accelerate\u3001PyTorch Lightning\u3001MosaicML\u7b49\u4e00\u9375\u5c0d\u63a5\uff0c\n<ul class=\"wp-block-list\">\n<li>\u6848\u4f8b\u898b<a href=\"https:\/\/www.deepspeed.ai\/integrations\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >\u6574\u5408\u6587\u6a94<\/a>\u3002<\/li>\n<\/ul>\n<\/li>\n\n\n\n<li><strong>\u652f\u63f4\u96f2\u7aef\u539f\u751f\u8207\u672c\u5730\u90e8\u7f72<\/strong>\uff1aAzure\u3001Kubernetes\u7b49\u5e73\u53f0\u5747\u6709\u5b98\u65b9\u90e8\u7f72\u7bc4\u4f8b\u3002<\/li>\n\n\n\n<li><strong>\u4e3b\u6d41AI\u5927\u6a21\u578b\u6a19\u914d<\/strong>\uff1aMT-530B\u3001BLOOM\u3001Jurassic-1\u3001GLM\u3001GPT-NeoX\u7b49\u7686\u4f7f\u7528DeepSpeed\u5b8c\u6210\u8a13\u7df4\/\u63a8\u7406\u3002<\/li>\n<\/ul>\n\n\n\n<h2 class=\"wp-block-heading\">\u5e38\u898b\u554f\u984c<\/h2>\n\n\n\n<h3 
class=\"wp-block-heading\">DeepSpeed\u652f\u63f4\u7684\u5206\u6563\u5f0fAI\u8a13\u7df4\u6709\u54ea\u4e9b\u985e\u578b\uff1f<\/h3>\n\n\n\n<p>DeepSpeed\u652f\u63f4\u8cc7\u6599\u4e26\u884c\uff08Data Parallel\uff09\u3001\u6a21\u578b\u4e26\u884c\uff08Model Parallel\uff09\u3001\u6d41\u6c34\u7dda\u4e26\u884c\uff08Pipeline Parallel\uff09\u3001\u5f35\u91cf\u4e26\u884c\uff08Tensor Parallel\uff09\u3001\u5c08\u5bb6\u6a21\u578b\u4e26\u884c\uff08Expert Parallel\uff09\u7b49\u4e3b\u6d41\u8a13\u7df4\u7bc4\u5f0f\uff0c\u5354\u540cZeRO\u7b49\u5275\u65b0\u6f14\u7b97\u6cd5\uff0c\u9069\u7528\u65bc\u5f9e\u55ae\u6a5f\u591a\u5361\u5230\u5343\u5361\u6a5f\u7d44\uff0c\u6975\u5927\u5730\u964d\u4f4e\u5404\u7a2e\u5834\u666f\u4e0b\u7684\u8a13\u7df4\u6210\u672c\u3002<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>\u66f4\u591aZeRO\u5206\u6563\u5f0f\u8aaa\u660e\u898b <a href=\"https:\/\/www.deepspeed.ai\/training\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >\u5b98\u65b9\u8a13\u7df4\u6280\u8853\u9801\u9762<\/a>\u3002<\/li>\n<\/ul>\n\n\n\n<h3 class=\"wp-block-heading\">\u5982\u679c\u9810\u7b97\u6709\u9650\uff0cDeepSpeed\u662f\u5426\u4e5f\u9069\u5408\u4e2d\u5c0f\u578b\u5718\u968a\uff1f<\/h3>\n\n\n\n<p>\u662f\u7684\u3002 DeepSpeed\u5275\u65b0\u7684\u8a18\u61b6\u9ad4\u7ba1\u7406\u548c\u5206\u6563\u5f0f\u7b56\u7565\u80fd\u8b93\u4e2d\u5c0f\u578b\u5718\u968a\u5229\u7528\u5e02\u552e\u55ae\u6a5f\u4f3a\u670d\u5668\u3001\u96f2\u7aef\u4e2d\u4f4e\u914dGPU\u5be6\u73fe\u4ee5\u5f80\u53ea\u6709\u300cAI\u5de8\u982d\u300d\u80fd\u5b8c\u6210\u7684\u8d85\u5927\u6a21\u578b\u8a13\u7df4\u3002\u4e26\u4e14\u5176\u5c0dCPU\u3001NVMe\u7b49\u5132\u5b58\u7684\u7570\u8cea\u512a\u5316\uff0c\u964d\u4f4e\u9ad8\u914d\u786c\u9ad4\u6295\u5165\u9580\u6abb\u3002\u90e8\u7f72\u53c3\u8003 <a href=\"https:\/\/www.deepspeed.ai\/getting-started\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >\u8cc7\u6e90\u914d\u7f6e\u6587\u6a94<\/a>\u3002<\/p>\n\n\n\n<figure class=\"wp-block-image size-full\"><img loading=\"lazy\" decoding=\"async\" 
width=\"1595\" height=\"918\" src=\"https:\/\/aicats.wiki\/wp-content\/uploads\/2025\/08\/image-215.png\" alt=\"\u8cc7\u6e90\u914d\u7f6e\u6587\u6a94\u3002\" class=\"wp-image-23639\"\/><figcaption class=\"wp-element-caption\">\u5716\uff0f<a href=\"https:\/\/www.deepspeed.ai\/getting-started\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >\u8cc7\u6e90\u914d\u7f6e\u6587\u6a94<\/a>\u3002<\/figcaption><\/figure>\n\n\n\n<h3 class=\"wp-block-heading\">DeepSpeed\u5c0d\u63a8\u7406\u90e8\u7f72\u548c\u6a21\u578b\u58d3\u7e2e\u6709\u4ec0\u9ebc\u5e6b\u52a9\uff1f<\/h3>\n\n\n\n<p>DeepSpeed-Inference\u548cDeepSpeed-Compression\u53ef\u5c07\u767e\u5104\u53c3\u6578\u6a21\u578b\u8f15\u9b06\u300c\u88dd\u4e0b\u300d8G\u53ca\u4ee5\u4e0a\u986f\u5b58\u5361\uff0c\u4e26\u986f\u8457\u63d0\u5347\u63a8\u7406\u4e26\u767c\u80fd\u529b\u548c\u901f\u5ea6\u3002 ZeroQuant\u7b49\u6280\u8853\u9084\u80fd\u5be6\u73fe\u6975\u4f4e\u6210\u672c\u7684W4A8\u7b49\u91cf\u5316\u6a21\u578b\uff0c\u65b9\u4fbf\u908a\u7de3\/\u4f4e\u983b\u5bec\u5834\u666f\u90e8\u7f72\u3002\u67e5\u770b <a href=\"https:\/\/www.deepspeed.ai\/inference\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >\u63a8\u7406\u6280\u8853\u9801\u9762<\/a> \u548c <a href=\"https:\/\/www.deepspeed.ai\/compression\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >\u58d3\u7e2e\u529f\u80fd<\/a> \u53d6\u5f97\u8a73\u7d30\u8cc7\u6599\u548c\u958b\u6e90\u5de5\u5177\u3002<\/p>\n\n\n\n<hr class=\"wp-block-separator 
has-alpha-channel-opacity\"\/>\n\n\n\n<p>\u96a8\u8457\u5927\u6a21\u578b\u6642\u4ee3\u5168\u9762\u5230\u4f86\uff0c<strong>DeepSpeed\u5df2\u6210\u70baAI\u8a13\u7df4\u6a21\u5f0f\u7684\u6838\u5fc3\u5f15\u64ce<\/strong>\u3002\u5b83\u7684\u958b\u6e90\u958b\u653e\u8207\u6975\u81f4\u6548\u80fd\uff0c\u8b93\u5f9e\u521d\u5b78\u8005\u5230AI\u5de8\u64d8\u90fd\u80fd\u6309\u9700\u5efa\u7acb\u5c6c\u65bc\u81ea\u5df1\u7684\u667a\u6167\u6a21\u578b\u3002\u7121\u8ad6\u4f60\u8eab\u8655AI\u79d1\u7814\u3001\u5de5\u696d\u843d\u5730\u6216\u96f2\u7aef\u539f\u751f\u670d\u52d9\uff0cDeepSpeed\u90fd\u662f\u4f60\u63a2\u7d22AI\u908a\u754c\u3001\u63d0\u5347\u6548\u7387\u8207\u63a7\u5236\u6210\u672c\u7684\u5f37\u529b\u81c2\u8180\u3002\u7acb\u5373\u524d\u5f80<a href=\"https:\/\/www.deepspeed.ai\/\" target=\"_blank\"  rel=\"nofollow noopener\"  class=\"external\" >DeepSpeed\u5b98\u7db2<\/a>\uff0c\u958b\u555fAI\u8a13\u7df4\u7684\u7121\u9650\u53ef\u80fd\u3002<\/p>","protected":false},"author":3,"comment_status":"open","ping_status":"closed","template":"","meta":{"_crsspst_to_aicatswiki":false,"_monsterinsights_skip_tracking":false,"_monsterinsights_sitenote_active":false,"_monsterinsights_sitenote_note":"","_monsterinsights_sitenote_category":0},"content_visibility":[262],"sitetag":[17,812,811,830],"favorites":[577],"class_list":{"0":"post-19891","1":"sites","2":"type-sites","3":"status-publish","4":"hentry","5":"sitetag-ai","9":"favorites-ai-models"},"aioseo_notices":[],"_links":{"self":[{"href":"https:\/\/aicats.wiki\/tw\/wp-json\/wp\/v2\/sites\/19891","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/aicats.wiki\/tw\/wp-json\/wp\/v2\/sites"}],"about":[{"href":"https:\/\/aicats.wiki\/tw\/wp-json\/wp\/v2\/types\/sites"}],"author":[{"embeddable":true,"href":"https:\/\/aicats.wiki\/tw\/wp-json\/wp\/v2\/users\/3"}],"replies":[{"embeddable":true,"href":"https:\/\/aicats.wiki\/tw\/wp-json\/wp\/v2\/comments?post=19891"}],"version-history":[{"count":2,"href":"https:\/\/aicats.wiki\/tw\/wp-json
\/wp\/v2\/sites\/19891\/revisions"}],"predecessor-version":[{"id":23642,"href":"https:\/\/aicats.wiki\/tw\/wp-json\/wp\/v2\/sites\/19891\/revisions\/23642"}],"wp:attachment":[{"href":"https:\/\/aicats.wiki\/tw\/wp-json\/wp\/v2\/media?parent=19891"}],"wp:term":[{"taxonomy":"content_visibility","embeddable":true,"href":"https:\/\/aicats.wiki\/tw\/wp-json\/wp\/v2\/content_visibility?post=19891"},{"taxonomy":"sitetag","embeddable":true,"href":"https:\/\/aicats.wiki\/tw\/wp-json\/wp\/v2\/sitetag?post=19891"},{"taxonomy":"favorites","embeddable":true,"href":"https:\/\/aicats.wiki\/tw\/wp-json\/wp\/v2\/favorites?post=19891"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}