{"provider_name":"Hatena Blog","height":"190","url":"https://inarizuuuushi.hatenablog.com/entry/2022/05/25/090000","version":"1.0","blog_url":"https://inarizuuuushi.hatenablog.com/","published":"2022-05-25 09:00:00","description":"@inproceedings{rajbhandari2020zero, title={Zero: Memory optimizations toward training trillion parameter models}, author={Rajbhandari, Samyam and Rasley, Jeff and Ruwase, Olatunji and He, Yuxiong}, booktitle={SC20: International Conference for High Performance Computing, Networking, Storage and Anal\u2026","author_url":"https://blog.hatena.ne.jp/inarizuuuushi/","categories":["\u8ad6\u6587\u30b5\u30fc\u30d9\u30a4"],"title":"\u30b5\u30fc\u30d9\u30a4: ZeRO: Memory Optimizations Toward Training Trillion Parameter Models","html":"<iframe src=\"https://hatenablog-parts.com/embed?url=https%3A%2F%2Finarizuuuushi.hatenablog.com%2Fentry%2F2022%2F05%2F25%2F090000\" title=\"\u30b5\u30fc\u30d9\u30a4: ZeRO: Memory Optimizations Toward Training Trillion Parameter Models - Sabrou-mal \u30b5\u30d6\u30ed\u30a6\u4e38\" class=\"embed-card embed-blogcard\" scrolling=\"no\" frameborder=\"0\" style=\"display: block; width: 100%; height: 190px; max-width: 500px; margin: 10px 0px;\"></iframe>","provider_url":"https://hatena.blog","author_name":"inarizuuuushi","image_url":"https://cdn-ak.f.st-hatena.com/images/fotolife/i/inarizuuuushi/20220520/20220520175259.png","width":"100%","type":"rich","blog_title":"Sabrou-mal \u30b5\u30d6\u30ed\u30a6\u4e38"}