diff --git a/docs/_posts/2023-08-24-ulysses-chinese.md b/docs/_posts/2023-08-24-ulysses-chinese.md
new file mode 100644
index 0000000000000000000000000000000000000000..613af2fe75838c6f6b5fbaf778d91351cce525c5
--- /dev/null
+++ b/docs/_posts/2023-08-24-ulysses-chinese.md
@@ -0,0 +1,7 @@
+---
+title: "DeepSpeed Ulysses: 训练极长序列Transformer模型的系统优化"
+excerpt: ""
+link: https://github.com/microsoft/DeepSpeed/blob/master/blogs/deepspeed-ulysses/chinese/README.md
+date: 2023-08-24 00:00:00
+tags: training ZeRO Chinese
+---
diff --git a/docs/_posts/2023-08-24-ulysses-japanese.md b/docs/_posts/2023-08-24-ulysses-japanese.md
new file mode 100644
index 0000000000000000000000000000000000000000..921c7c28739df3fd85d08608ac645295dfb1b382
--- /dev/null
+++ b/docs/_posts/2023-08-24-ulysses-japanese.md
@@ -0,0 +1,7 @@
+---
+title: "DeepSpeed Ulysses: Transformerモデルを非常に長いシーケンスで訓練するための最適化"
+excerpt: ""
+link: https://github.com/microsoft/DeepSpeed/blob/master/blogs/deepspeed-ulysses/japanese/README.md
+date: 2023-08-24 00:00:00
+tags: training ZeRO Japanese
+---
diff --git a/docs/_posts/2023-08-24-ulysses.md b/docs/_posts/2023-08-24-ulysses.md
new file mode 100644
index 0000000000000000000000000000000000000000..a88a0d66080a8eb297f3922a9a1987da3d609bd3
--- /dev/null
+++ b/docs/_posts/2023-08-24-ulysses.md
@@ -0,0 +1,7 @@
+---
+title: "DeepSpeed Ulysses: System Optimizations for Enabling Training of Extreme Long Sequence Transformer Models"
+excerpt: ""
+link: https://github.com/microsoft/DeepSpeed/blob/master/blogs/deepspeed-ulysses/README.md
+date: 2023-08-24 00:00:00
+tags: training ZeRO English
+---