From 68a4a1bf3df8aaf70359a9f5bafd7a1306f4099f Mon Sep 17 00:00:00 2001
From: Cheng Li
Date: Fri, 25 Feb 2022 10:48:10 -0800
Subject: [PATCH 01/20] add inference post

---
 docs/_posts/2021-05-05-MoQ.md               | 2 +-
 docs/_posts/2021-05-14-inference-release.md | 8 ++++++++
 2 files changed, 9 insertions(+), 1 deletion(-)
 create mode 100644 docs/_posts/2021-05-14-inference-release.md

diff --git a/docs/_posts/2021-05-05-MoQ.md b/docs/_posts/2021-05-05-MoQ.md
index 95dd8c7d1cb4..beecf3ab9ee6 100644
--- a/docs/_posts/2021-05-05-MoQ.md
+++ b/docs/_posts/2021-05-05-MoQ.md
@@ -4,7 +4,7 @@ title: "Mixture-of-Quantization: A novel quantization approach for reducing mode
 excerpt: ""
 categories: news
 new_post: false
-date: 2020-05-28 00:00:00
+date: 2021-05-05 00:00:00
 ---

 ## A unified suite for quantization-aware training and inference

diff --git a/docs/_posts/2021-05-14-inference-release.md b/docs/_posts/2021-05-14-inference-release.md
new file mode 100644
index 000000000000..5dc9fdc15c0a
--- /dev/null
+++ b/docs/_posts/2021-05-14-inference-release.md
@@ -0,0 +1,8 @@
+---
+layout: single
+title: "DeepSpeed: Accelerating large-scale model inference and training via system optimizations and compression"
+date: 2021-05-14
+link: https://www.microsoft.com/en-us/research/blog/deepspeed-accelerating-large-scale-model-inference-and-training-via-system-optimizations-and-compression/
+excerpt: "Developed by Microsoft AI & Research."
+categories: news
+---

From 8ba6415f2fc4758173025c063e6ac53cc9c80b0d Mon Sep 17 00:00:00 2001
From: Cheng Li
Date: Fri, 25 Feb 2022 13:24:59 -0800
Subject: [PATCH 02/20] fix format

---
 docs/_data/navigation.yml                       | 114 +++++++++---
 docs/_layouts/feed.html                         |  22 ++++
 docs/_layouts/news-home.html                    |  13 +-
 docs/_layouts/tags.html                         |  16 +++
 docs/_posts/2020-02-13-release.md               |   1 +
 docs/_posts/2020-02-13-turing-nlg.md            |   1 +
 docs/_posts/2020-05-19-bert-record.md           |   1 +
 docs/_posts/2020-05-19-press-release.md         |   1 +
 docs/_posts/2020-05-19-zero-stage2.md           |   1 +
 .../2020-05-28-fastest-bert-training.md         |   1 +
 docs/_posts/2020-07-24-deepspeed-webinar.md     |   1 +
 docs/_posts/2020-08-07-webinar-on-demand.md     |   1 +
 .../2020-09-08-sparse-attention-news.md         |   1 +
 docs/_posts/2020-09-09-ZeRO-Offload.md          |   1 +
 .../2020-09-09-onebit-adam-blog-post.md         |   1 +
 docs/_posts/2020-09-09-onebit-adam-news.md      |   1 +
 .../_posts/2020-09-09-pipeline-parallelism.md   |   1 +
 docs/_posts/2020-09-09-sparse-attention.md      |   1 +
 ...0-10-28-progressive-layer-dropping-news.md   |   1 +
 docs/_posts/2021-03-08-zero3-offload.md         |   1 +
 docs/_posts/2021-05-05-MoQ.md                   |   1 +
 ...021-05-05-inference-kernel-optimization.md   |   1 +
 docs/_posts/2021-05-14-inference-release.md     |   1 +
 docs/_posts/2021-08-18-deepspeed-moe.md         |   1 +
 docs/_posts/2021-11-15-autotuning.md            |   1 +
 docs/_posts/2021-12-09-deepspeed-moe-nlg.md     |   1 +
 docs/_posts/2022-01-19-moe-inference.md         |   1 +
 27 files changed, 129 insertions(+), 59 deletions(-)
 create mode 100644 docs/_layouts/feed.html
 create mode 100644 docs/_layouts/tags.html

diff --git a/docs/_data/navigation.yml b/docs/_data/navigation.yml
index afdc7e218705..00a3184b5b2e 100755
--- a/docs/_data/navigation.yml
+++ b/docs/_data/navigation.yml
@@ -1,120 +1,120 @@
 main:
-  - title: "Getting Started"
+  - title: 'Getting Started'
     url: /getting-started/
-  - title: "News"
+  - title: 'Blog'
     url: /news/
-  - title: "Tutorials"
+  - title: 'Tutorials'
     url: /tutorials/
-  - title: "Documentation"
+  - title: 'Documentation'
     url: https://deepspeed.readthedocs.io/
-  - title: "GitHub"
+  - title: 'GitHub'
     url: https://github.com/microsoft/DeepSpeed

 lnav:
title: "Feature Overview" + - title: 'Feature Overview' url: /features/ - - title: "Getting Started" + - title: 'Getting Started' url: /getting-started/ children: - - title: "Installation" + - title: 'Installation' url: /getting-started/#installation - - title: "Writing models" + - title: 'Writing models' url: /getting-started/#writing-deepspeed-models - - title: "Training" + - title: 'Training' url: /getting-started/#training - - title: "Launching" + - title: 'Launching' url: /getting-started/#launching-deepspeed-training - - title: "Configuration" + - title: 'Configuration' url: /docs/config-json/ children: - - title: "Autotuning" + - title: 'Autotuning' url: /docs/config-json/#autotuning - - title: "Batch size" + - title: 'Batch size' url: /docs/config-json/#batch-size-related-parameters - - title: "Optimizer" + - title: 'Optimizer' url: /docs/config-json/#optimizer-parameters - - title: "Scheduler" + - title: 'Scheduler' url: /docs/config-json/#scheduler-parameters - - title: "Communication" + - title: 'Communication' url: /docs/config-json/#communication-options - - title: "FP16" + - title: 'FP16' url: /docs/config-json/#fp16-training-options - - title: "BFOAT16" + - title: 'BFOAT16' url: /docs/config-json/#bfloat16-training-options - - title: "Gradient Clipping" + - title: 'Gradient Clipping' url: /docs/config-json/#gradient-clipping - - title: "ZeRO optimizations" + - title: 'ZeRO optimizations' url: /docs/config-json/#zero-optimizations-for-fp16-training - - title: "Parameter Offloading" + - title: 'Parameter Offloading' url: /docs/config-json/#parameter-offloading - - title: "Optimizer Offloading" + - title: 'Optimizer Offloading' url: /docs/config-json/#optimizer-offloading - - title: "Asynchronous I/O" + - title: 'Asynchronous I/O' url: /docs/config-json/#asynchronous-io - - title: "Logging" + - title: 'Logging' url: /docs/config-json/#logging - - title: "Flops Profiler" + - title: 'Flops Profiler' url: /docs/config-json/#flops-profiler - - title: "PyTorch Profiler" + - title: 'PyTorch Profiler' url: /docs/config-json/#pytorch-profiler - - title: "Activation checkpointing" + - title: 'Activation checkpointing' url: /docs/config-json/#activation-checkpointing - - title: "Sparse Attention" + - title: 'Sparse Attention' url: /docs/config-json/#sparse-attention - - title: "Logging to TensorBoard" + - title: 'Logging to TensorBoard' url: /docs/config-json/#tensorboard-options - - title: "Tutorials" + - title: 'Tutorials' url: /tutorials/ children: - - title: "Getting started" + - title: 'Getting started' url: /getting-started/ - - title: "Getting started on Azure" + - title: 'Getting started on Azure' url: /tutorials/azure/ - - title: "Autotuning" + - title: 'Autotuning' url: /tutorials/autotuning/ - - title: "BingBertSQuAD Fine-tuning" + - title: 'BingBertSQuAD Fine-tuning' url: /tutorials/bert-finetuning/ - - title: "BERT Pre-training" + - title: 'BERT Pre-training' url: /tutorials/bert-pretraining/ - - title: "CIFAR-10" + - title: 'CIFAR-10' url: /tutorials/cifar-10/ - - title: "Curriculum Learning" + - title: 'Curriculum Learning' url: /tutorials/curriculum-learning/ - - title: "Flops Profiler" + - title: 'Flops Profiler' url: /tutorials/flops-profiler/ - - title: "PyTorch Profiler" + - title: 'PyTorch Profiler' url: /tutorials/pytorch-profiler/ - - title: "GAN" + - title: 'GAN' url: /tutorials/gan/ - - title: "Inference" + - title: 'Inference' url: /tutorials/inference-tutorial/ - - title: "Learning Rate Range Test" + - title: 'Learning Rate Range Test' url: /tutorials/lrrt/ - - 
title: "Megatron-LM GPT2" + - title: 'Megatron-LM GPT2' url: /tutorials/megatron/ - - title: "Mixture-of-Experts (MoE)" + - title: 'Mixture-of-Experts (MoE)' url: /tutorials/mixture-of-experts/ - - title: "Mixture-of-Experts for NLG" + - title: 'Mixture-of-Experts for NLG' url: /tutorials/mixture-of-experts-nlg/ - - title: "Mixture-of-Quantization" + - title: 'Mixture-of-Quantization' url: /tutorials/MoQ-tutorial/ - - title: "One-Cycle Schedule" + - title: 'One-Cycle Schedule' url: /tutorials/one-cycle/ - - title: "One-Bit Adam" + - title: 'One-Bit Adam' url: /tutorials/onebit-adam/ - - title: "One-Bit LAMB" + - title: 'One-Bit LAMB' url: /tutorials/onebit-lamb/ - - title: "Pipeline Parallelism" + - title: 'Pipeline Parallelism' url: /tutorials/pipeline/ - - title: "Progressive Layer Dropping" + - title: 'Progressive Layer Dropping' url: /tutorials/progressive_layer_dropping/ - - title: "Sparse Attention" + - title: 'Sparse Attention' url: /tutorials/sparse-attention/ - - title: "Transformer Kernel" + - title: 'Transformer Kernel' url: /tutorials/transformer_kernel/ - - title: "ZeRO-Offload" + - title: 'ZeRO-Offload' url: /tutorials/zero-offload/ - - title: "ZeRO Redundancy Optimizer (ZeRO)" + - title: 'ZeRO Redundancy Optimizer (ZeRO)' url: /tutorials/zero/ - - title: "Contributing" + - title: 'Contributing' url: /contributing/ diff --git a/docs/_layouts/feed.html b/docs/_layouts/feed.html new file mode 100644 index 000000000000..83b137b6908e --- /dev/null +++ b/docs/_layouts/feed.html @@ -0,0 +1,22 @@ + + + {{ site.title }} + + + {{ site.time | date_to_xmlschema }} + {{ site.url }} + + {{ site.author.name }} + {{ site.author.email }} + + + {% for post in site.posts %} {% if post.tags contains page.tag-name %} + + {{ post.title | xml_escape }} + + {{ post.date | date_to_xmlschema }} + {{ site.url }}{{ post.id }} + {{ post.content | xml_escape }} + + {% endif %} {% endfor %} + diff --git a/docs/_layouts/news-home.html b/docs/_layouts/news-home.html index 8248eed5b551..116b4208e4fe 100644 --- a/docs/_layouts/news-home.html +++ b/docs/_layouts/news-home.html @@ -11,7 +11,7 @@ {% assign posts = site.posts %} {% endif %} - + + +{% for tag in site.tags %} +

{{ tag[0] }}

+ +{% endfor %} diff --git a/docs/_layouts/tags.html b/docs/_layouts/tags.html new file mode 100644 index 000000000000..43f34f6771f4 --- /dev/null +++ b/docs/_layouts/tags.html @@ -0,0 +1,16 @@ +--- +layout: default +--- + +
+

Articles tagged with ""

+
    + + {% for post in site.posts %} + {% if post.tags contains page.tag-name %} +
  • {{ post.title }}, published {{ post.date | date: "%Y-%m-%d" }}
  • + {% endif %} + {% endfor %} + +
+
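Editor's note: the tags.html layout above lists every post whose `tags` include the page's `tag-name`, and feed.html emits a matching per-tag feed, but neither hunk adds the per-tag pages themselves. A minimal sketch of what one such page's front matter might look like — the path and title here are hypothetical; only `layout` and `tag-name` are actually consumed by the layouts:

```yaml
---
layout: tags
title: 'Articles tagged with "training"'  # hypothetical title
tag-name: training                        # matched against each post's tags list
permalink: /tags/training/                # hypothetical path
---
```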
diff --git a/docs/_posts/2020-02-13-release.md b/docs/_posts/2020-02-13-release.md
index 968e97c9b420..6c5a063845ea 100644
--- a/docs/_posts/2020-02-13-release.md
+++ b/docs/_posts/2020-02-13-release.md
@@ -5,4 +5,5 @@ date: 2020-02-13
 link: https://www.microsoft.com/en-us/research/blog/zero-deepspeed-new-system-optimizations-enable-training-models-with-over-100-billion-parameters/
 excerpt: "Developed by Microsoft AI & Research."
 categories: news
+tags: training zero
 ---

diff --git a/docs/_posts/2020-02-13-turing-nlg.md b/docs/_posts/2020-02-13-turing-nlg.md
index 32ecd65379c1..05e99beca307 100644
--- a/docs/_posts/2020-02-13-turing-nlg.md
+++ b/docs/_posts/2020-02-13-turing-nlg.md
@@ -5,4 +5,5 @@ date: 2020-02-13
 link: https://www.microsoft.com/en-us/research/blog/turing-nlg-a-17-billion-parameter-language-model-by-microsoft/
 excerpt: "DeepSpeed was used to train the world's largest language model."
 categories: news
+tags: training
 ---

diff --git a/docs/_posts/2020-05-19-bert-record.md b/docs/_posts/2020-05-19-bert-record.md
index 4a00681cbfcd..db70c95cc1ab 100644
--- a/docs/_posts/2020-05-19-bert-record.md
+++ b/docs/_posts/2020-05-19-bert-record.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: true
 date: 2020-05-19 00:00:00
+tags: training
 ---

 We introduce new technology to accelerate single GPU performance via kernel

diff --git a/docs/_posts/2020-05-19-press-release.md b/docs/_posts/2020-05-19-press-release.md
index 0a247e253074..c84192b297c7 100644
--- a/docs/_posts/2020-05-19-press-release.md
+++ b/docs/_posts/2020-05-19-press-release.md
@@ -6,4 +6,5 @@ link: https://www.microsoft.com/en-us/research/blog/zero-2-deepspeed-shattering-
 categories: news
 new_post: false
 date: 2020-05-19 02:00:00
+tags: training zero
 ---

diff --git a/docs/_posts/2020-05-19-zero-stage2.md b/docs/_posts/2020-05-19-zero-stage2.md
index 5ce3ad252223..87b5214d203f 100644
--- a/docs/_posts/2020-05-19-zero-stage2.md
+++ b/docs/_posts/2020-05-19-zero-stage2.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: false
 date: 2020-05-19 01:00:00
+tags: training zero
 ---

 ZeRO-2 expands the scope of memory optimizations in the original ZeRO by

diff --git a/docs/_posts/2020-05-28-fastest-bert-training.md b/docs/_posts/2020-05-28-fastest-bert-training.md
index 923319449bbf..9abaf96ec354 100644
--- a/docs/_posts/2020-05-28-fastest-bert-training.md
+++ b/docs/_posts/2020-05-28-fastest-bert-training.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: false
 date: 2020-05-28 00:00:00
+tags: training
 ---

 Good news! **DeepSpeed obtains the fastest BERT training record: 44 minutes on

diff --git a/docs/_posts/2020-07-24-deepspeed-webinar.md b/docs/_posts/2020-07-24-deepspeed-webinar.md
index 276b97c9522e..57e67ba654c6 100644
--- a/docs/_posts/2020-07-24-deepspeed-webinar.md
+++ b/docs/_posts/2020-07-24-deepspeed-webinar.md
@@ -7,4 +7,5 @@ link: https://note.microsoft.com/MSR-Webinar-DeepSpeed-Registration-On-Demand.ht
 image: /assets/images/webinar-aug2020.png
 new_post: true
 date: 2020-07-24 00:00:00
+tags: presentations
 ---

diff --git a/docs/_posts/2020-08-07-webinar-on-demand.md b/docs/_posts/2020-08-07-webinar-on-demand.md
index 6d255520c0df..6ee2c77031ed 100644
--- a/docs/_posts/2020-08-07-webinar-on-demand.md
+++ b/docs/_posts/2020-08-07-webinar-on-demand.md
@@ -6,4 +6,5 @@ categories: news
 link: https://note.microsoft.com/MSR-Webinar-DeepSpeed-Registration-On-Demand.html
 new_post: true
 date: 2020-08-07 00:00:00
+tags: presentations
 ---

diff --git a/docs/_posts/2020-09-08-sparse-attention-news.md b/docs/_posts/2020-09-08-sparse-attention-news.md
index 6f235818c33f..2cb1d0007a91 100644
--- a/docs/_posts/2020-09-08-sparse-attention-news.md
+++ b/docs/_posts/2020-09-08-sparse-attention-news.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: true
 date: 2020-09-09 00:00:00
+tags: training
 ---

 DeepSpeed offers sparse attention kernels, an instrumental technology to support long sequences of model inputs, whether for text, image, or sound. Compared with the classic dense Transformers, it powers an order-of-magnitude longer input sequence and obtains up to 6x faster execution with comparable accuracy. It also outperforms state-of-the-art sparse implementations with 1.5-3x faster execution. Furthermore, our sparse kernels support efficient execution of flexible sparse format and empower users to innovate on their custom sparse structures.

diff --git a/docs/_posts/2020-09-09-ZeRO-Offload.md b/docs/_posts/2020-09-09-ZeRO-Offload.md
index 9a45ba8f244e..6c108d25156a 100755
--- a/docs/_posts/2020-09-09-ZeRO-Offload.md
+++ b/docs/_posts/2020-09-09-ZeRO-Offload.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: true
 date: 2020-09-09 00:00:00
+tags: training zero
 ---

 We introduce a new technology called ZeRO-Offload to enable **10X bigger model training on a single GPU**. ZeRO-Offload extends ZeRO-2 to leverage both CPU and GPU memory for training large models. Using a machine with **a single GPU**, our users now can run **models of up to 13 billion parameters** without running out of memory, 10x bigger than the existing approaches, while obtaining competitive throughput. This feature democratizes multi-billion-parameter model training and opens the window for many deep learning practitioners to explore bigger and better models.

diff --git a/docs/_posts/2020-09-09-onebit-adam-blog-post.md b/docs/_posts/2020-09-09-onebit-adam-blog-post.md
index b16a101578f0..6e8836a0e1f3 100644
--- a/docs/_posts/2020-09-09-onebit-adam-blog-post.md
+++ b/docs/_posts/2020-09-09-onebit-adam-blog-post.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: false
 date: 2020-09-09 00:00:00
+tags: training communication
 ---

 ## 1. Introduction

diff --git a/docs/_posts/2020-09-09-onebit-adam-news.md b/docs/_posts/2020-09-09-onebit-adam-news.md
index 5dc0f3bd2004..c0ffe748bad2 100644
--- a/docs/_posts/2020-09-09-onebit-adam-news.md
+++ b/docs/_posts/2020-09-09-onebit-adam-news.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: true
 date: 2020-09-09 00:00:00
+tags: training communication
 ---

diff --git a/docs/_posts/2020-09-09-pipeline-parallelism.md b/docs/_posts/2020-09-09-pipeline-parallelism.md
index d8aa20c1cee5..5b588e32f5d6 100644
--- a/docs/_posts/2020-09-09-pipeline-parallelism.md
+++ b/docs/_posts/2020-09-09-pipeline-parallelism.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: true
 date: 2020-09-09 00:00:00
+tags: training
 ---

 DeepSpeed includes new support for pipeline parallelism! DeepSpeed's training

diff --git a/docs/_posts/2020-09-09-sparse-attention.md b/docs/_posts/2020-09-09-sparse-attention.md
index 79032eeaa153..2dc0c368df82 100644
--- a/docs/_posts/2020-09-09-sparse-attention.md
+++ b/docs/_posts/2020-09-09-sparse-attention.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: true
 date: 2020-09-09 01:00:00
+tags: training inference
 ---

 Attention-based deep learning models such as the transformers are highly effective in capturing relationship between tokens in an input sequence, even across long distances. As a result, they are used with text, image, and sound-based inputs, where the sequence length can be in thousands of tokens. However, despite the effectiveness of attention modules to capture long term dependencies, in practice, their application to long sequence input is limited by compute and memory requirements of the attention computation that grow quadratically, `O(n^2)`, with the sequence length `n`.

diff --git a/docs/_posts/2020-10-28-progressive-layer-dropping-news.md b/docs/_posts/2020-10-28-progressive-layer-dropping-news.md
index 5659cf818987..3e06f2dfe72c 100755
--- a/docs/_posts/2020-10-28-progressive-layer-dropping-news.md
+++ b/docs/_posts/2020-10-28-progressive-layer-dropping-news.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: true
 date: 2020-10-29 00:00:00
+tags: training
 ---

 We introduce a new technology called progressive layer dropping (PLD) to speedup the pre-training of Transformer-based networks through efficient and robust compressed training. The pre-training step of Transformer networks often suffer from unbearable overall computational expenses. We analyze the training dynamics and stability of Transformer networks and propose PLD to sparsely update Transformer blocks following a progressive dropping schedule, which smoothly increases the layer dropping rate for each mini-batch as training evolves along both the temporal and the model depth dimension. PLD is able to allow the pre-training to be **2.5X faster** to get similar accuracy on downstream tasks and allows the training to be **24% faster** when training the same number of samples, not at the cost of excessive hardware resources.

diff --git a/docs/_posts/2021-03-08-zero3-offload.md b/docs/_posts/2021-03-08-zero3-offload.md
index 8e5778afa0fc..e9c8cd470eff 100644
--- a/docs/_posts/2021-03-08-zero3-offload.md
+++ b/docs/_posts/2021-03-08-zero3-offload.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: true
 date: 2021-03-08 00:00:00
+tags: training zero
 ---

 Today we are announcing the release of ZeRO-3 Offload, a highly efficient and easy to use implementation of ZeRO Stage 3 and ZeRO Offload combined, geared towards our continued goal of democratizing AI by making efficient large-scale DL training available to everyone. The key benefits of ZeRO-3 Offload are:

diff --git a/docs/_posts/2021-05-05-MoQ.md b/docs/_posts/2021-05-05-MoQ.md
index beecf3ab9ee6..a9582c652ab4 100644
--- a/docs/_posts/2021-05-05-MoQ.md
+++ b/docs/_posts/2021-05-05-MoQ.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: false
 date: 2021-05-05 00:00:00
+tags: inference
 ---

 ## A unified suite for quantization-aware training and inference

diff --git a/docs/_posts/2021-05-05-inference-kernel-optimization.md b/docs/_posts/2021-05-05-inference-kernel-optimization.md
index 2042703f4729..218387c07f55 100644
--- a/docs/_posts/2021-05-05-inference-kernel-optimization.md
+++ b/docs/_posts/2021-05-05-inference-kernel-optimization.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: false
 date: 2021-03-16 00:00:00
+tags: inference
 ---

 While DeepSpeed supports training advanced large-scale models, using these trained models in the desired application scenarios is still challenging due to three major limitations in existing inference solutions: 1) lack of support for multi-GPU inference to fit large models and meet latency requirements, 2) limited GPU kernel performance when running inference with small batch sizes, and 3) difficulties in exploiting quantization, which includes both quantizing the model to reduce the model size and latency as well as supporting high-performance inference of quantized models without specialized hardware.

diff --git a/docs/_posts/2021-05-14-inference-release.md b/docs/_posts/2021-05-14-inference-release.md
index 5dc9fdc15c0a..658627e7115f 100644
--- a/docs/_posts/2021-05-14-inference-release.md
+++ b/docs/_posts/2021-05-14-inference-release.md
@@ -5,4 +5,5 @@ date: 2021-05-14
 link: https://www.microsoft.com/en-us/research/blog/deepspeed-accelerating-large-scale-model-inference-and-training-via-system-optimizations-and-compression/
 excerpt: "Developed by Microsoft AI & Research."
 categories: news
+tags: inference
 ---

diff --git a/docs/_posts/2021-08-18-deepspeed-moe.md b/docs/_posts/2021-08-18-deepspeed-moe.md
index 3f21e26a74dd..0cc61f52d0fc 100644
--- a/docs/_posts/2021-08-18-deepspeed-moe.md
+++ b/docs/_posts/2021-08-18-deepspeed-moe.md
@@ -6,4 +6,5 @@ categories: news
 link: https://www.microsoft.com/en-us/research/blog/deepspeed-powers-8x-larger-moe-model-training-with-high-performance/
 new_post: true
 date: 2021-08-18 00:00:00
+tags: training
 ---

diff --git a/docs/_posts/2021-11-15-autotuning.md b/docs/_posts/2021-11-15-autotuning.md
index dd8d94dcef02..00ea4f1aa27b 100644
--- a/docs/_posts/2021-11-15-autotuning.md
+++ b/docs/_posts/2021-11-15-autotuning.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: true
 date: 2021-11-16 00:00:00
+tags: training
 ---

 We introduce a new feature called Autotuning to automatically discover the optimal DeepSpeed configuration that delivers good training speed. One pain point in model training is to figure out good performance-relevant configurations such as micro-batch size to fully utilize the hardware and achieve a high throughput number. This configuration exploring process is commonly done manually but is important since model training is repeated many times and benefits from using a good configuration. Not only is the hand-tuning process time-consuming, but the outcome is hardware-dependent. This means that a good configuration on one hardware might not be the best on another different hardware. The user thus has to hand tune the configuration again. With DeepSpeed, there are more configuration parameters that could potentially affect the training speed, thus making it more tedious to manually tune the configuration.

diff --git a/docs/_posts/2021-12-09-deepspeed-moe-nlg.md b/docs/_posts/2021-12-09-deepspeed-moe-nlg.md
index b6898f2313d6..ea92b791c449 100644
--- a/docs/_posts/2021-12-09-deepspeed-moe-nlg.md
+++ b/docs/_posts/2021-12-09-deepspeed-moe-nlg.md
@@ -5,6 +5,7 @@ excerpt: ""
 categories: news
 new_post: false
 date: 2021-12-09 22:00:00
+tags: training
 ---

 Published on December 9, 2021

diff --git a/docs/_posts/2022-01-19-moe-inference.md b/docs/_posts/2022-01-19-moe-inference.md
index 88046f72c6fa..1554f7bc5fc0 100644
--- a/docs/_posts/2022-01-19-moe-inference.md
+++ b/docs/_posts/2022-01-19-moe-inference.md
@@ -6,4 +6,5 @@ categories: news
 link: https://www.microsoft.com/en-us/research/blog/deepspeed-advancing-moe-inference-and-training-to-power-next-generation-ai-scale/
 new_post: true
 date: 2022-01-19 00:00:00
+tags: inference
 ---
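Editor's note: the next patch moves each post's labels from `tags:` to `categories:`. Jekyll indexes both keys automatically, but `site.categories` is what the new news layout iterates, so a template can group posts per category without any custom filtering. A minimal sketch of that access pattern (markup simplified; not taken from the patch):

```html
{% assign categories = site.categories | sort %}
{% for category in categories %}
  {% assign name  = category | first %}  <!-- e.g. "training" -->
  {% assign posts = category | last %}   <!-- posts in that category, newest first -->
  <h2>{{ name }} ({{ posts | size }})</h2>
  <ul>
    {% for post in posts %}
      <li><a href="{{ post.url | relative_url }}">{{ post.title }}</a></li>
    {% endfor %}
  </ul>
{% endfor %}
```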
From 993fccd92c89258103cd86bb8fdef1a3f45dc056 Mon Sep 17 00:00:00 2001
From: Cheng Li
Date: Sat, 26 Feb 2022 10:46:03 +0500
Subject: [PATCH 03/20] use categories filtering

---
 docs/_layouts/news-home.html                    | 38 +++++++++++++-
 docs/_layouts/news.html                         | 52 +++++++++++++++++++
 docs/_posts/2020-02-13-release.md               |  3 +-
 docs/_posts/2020-02-13-turing-nlg.md            |  3 +-
 docs/_posts/2020-05-19-bert-record.md           |  3 +-
 docs/_posts/2020-05-19-press-release.md         |  3 +-
 docs/_posts/2020-05-19-zero-stage2.md           |  3 +-
 .../2020-05-28-fastest-bert-training.md         |  3 +-
 docs/_posts/2020-07-24-deepspeed-webinar.md     |  3 +-
 docs/_posts/2020-08-07-webinar-on-demand.md     |  3 +-
 .../2020-09-08-sparse-attention-news.md         |  3 +-
 docs/_posts/2020-09-09-ZeRO-Offload.md          |  3 +-
 .../2020-09-09-onebit-adam-blog-post.md         |  3 +-
 docs/_posts/2020-09-09-onebit-adam-news.md      |  3 +-
 .../_posts/2020-09-09-pipeline-parallelism.md   |  3 +-
 docs/_posts/2020-09-09-sparse-attention.md      |  3 +-
 ...0-10-28-progressive-layer-dropping-news.md   |  3 +-
 docs/_posts/2021-03-08-zero3-offload.md         |  3 +-
 docs/_posts/2021-05-05-MoQ.md                   |  3 +-
 ...021-05-05-inference-kernel-optimization.md   |  3 +-
 docs/_posts/2021-05-14-inference-release.md     |  3 +-
 docs/_posts/2021-08-18-deepspeed-moe.md         |  3 +-
 docs/_posts/2021-11-15-autotuning.md            |  3 +-
 docs/_posts/2021-12-09-deepspeed-moe-nlg.md     |  3 +-
 docs/_posts/2022-01-19-moe-inference.md         |  3 +-
 docs/news/index.html                            |  2 +-
 26 files changed, 112 insertions(+), 49 deletions(-)
 create mode 100644 docs/_layouts/news.html

diff --git a/docs/_layouts/news-home.html b/docs/_layouts/news-home.html
index 116b4208e4fe..0ebdf0ea609f 100644
--- a/docs/_layouts/news-home.html
+++ b/docs/_layouts/news-home.html
@@ -11,6 +11,40 @@
 {% assign posts = site.posts %}
 {% endif %}

+
+
+ {% for post in site.posts %}
+
+ + + +
+ {% endfor %} +
+ + + + + + + -{% for tag in site.tags %} + diff --git a/docs/_layouts/news.html b/docs/_layouts/news.html new file mode 100644 index 000000000000..d0d5f82787ac --- /dev/null +++ b/docs/_layouts/news.html @@ -0,0 +1,52 @@ +--- +layout: archive +post-content: +backsite: javascript:history.back() +--- + +{% if paginator %} + {% assign posts = paginator.posts %} +{% else %} + {% assign posts = site.posts %} +{% endif %} + + + +
+ + {% assign categories = site.categories | sort %} + {% for category in categories %} + {% assign cat = category | first %} + + {% endfor %} +
+
+ +
+ {% assign id = 0 %} + {% for post in site.posts %} + {% assign id = id | plus:1 %} +
+

+ {{ post.articletitle }}
+ · + {% include archive-single.html %} + {% if post.image %} + + {% endif %} +

+
+ {% endfor %} +
\ No newline at end of file
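Editor's note: the news.html layout above emits one button per category and one entry per post, but no filtering logic is visible in the hunk. If the buttons are meant to narrow the list client-side, one plausible wiring — assuming hypothetical entry wrappers carrying a `data-categories` attribute and buttons that call `filterSelection(...)`; none of these names are taken from the patch — would be:

```html
<script>
  // Show only entries whose data-categories contain the selected
  // category; "all" restores every entry.
  function filterSelection(category) {
    document.querySelectorAll('.archive__item').forEach(function (el) {
      var cats = (el.dataset.categories || '').split(' ');
      var show = category === 'all' || cats.indexOf(category) !== -1;
      el.style.display = show ? '' : 'none';
    });
  }
</script>
```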
diff --git a/docs/_posts/2020-02-13-release.md b/docs/_posts/2020-02-13-release.md
index 6c5a063845ea..d8482de7288b 100644
--- a/docs/_posts/2020-02-13-release.md
+++ b/docs/_posts/2020-02-13-release.md
@@ -4,6 +4,5 @@ title: "ZeRO & DeepSpeed: New system optimizations enable training models with o
 date: 2020-02-13
 link: https://www.microsoft.com/en-us/research/blog/zero-deepspeed-new-system-optimizations-enable-training-models-with-over-100-billion-parameters/
 excerpt: "Developed by Microsoft AI & Research."
-categories: news
-tags: training zero
+categories: training zero
 ---

diff --git a/docs/_posts/2020-02-13-turing-nlg.md b/docs/_posts/2020-02-13-turing-nlg.md
index 05e99beca307..cb9ee59e314f 100644
--- a/docs/_posts/2020-02-13-turing-nlg.md
+++ b/docs/_posts/2020-02-13-turing-nlg.md
@@ -4,6 +4,5 @@ title: "Turing-NLG: A 17-billion-parameter language model by Microsoft"
 date: 2020-02-13
 link: https://www.microsoft.com/en-us/research/blog/turing-nlg-a-17-billion-parameter-language-model-by-microsoft/
 excerpt: "DeepSpeed was used to train the world's largest language model."
-categories: news
-tags: training
+categories: training
 ---

diff --git a/docs/_posts/2020-05-19-bert-record.md b/docs/_posts/2020-05-19-bert-record.md
index db70c95cc1ab..ce2f58b231f1 100644
--- a/docs/_posts/2020-05-19-bert-record.md
+++ b/docs/_posts/2020-05-19-bert-record.md
@@ -2,10 +2,9 @@
 layout: single
 title: "The Fastest and Most Efficient BERT Training through Optimized Transformer Kernels"
 excerpt: ""
-categories: news
+categories: training
 new_post: true
 date: 2020-05-19 00:00:00
-tags: training
 ---

 We introduce new technology to accelerate single GPU performance via kernel

diff --git a/docs/_posts/2020-05-19-press-release.md b/docs/_posts/2020-05-19-press-release.md
index c84192b297c7..b8e2dd09b02f 100644
--- a/docs/_posts/2020-05-19-press-release.md
+++ b/docs/_posts/2020-05-19-press-release.md
@@ -3,8 +3,7 @@ layout: single
 title: "ZeRO-2 & DeepSpeed: Shattering Barriers of Deep Learning Speed & Scale"
 excerpt: ""
 link: https://www.microsoft.com/en-us/research/blog/zero-2-deepspeed-shattering-barriers-of-deep-learning-speed-scale/
-categories: news
+categories: training zero
 new_post: false
 date: 2020-05-19 02:00:00
-tags: training zero
 ---

diff --git a/docs/_posts/2020-05-19-zero-stage2.md b/docs/_posts/2020-05-19-zero-stage2.md
index 87b5214d203f..39504032d2ae 100644
--- a/docs/_posts/2020-05-19-zero-stage2.md
+++ b/docs/_posts/2020-05-19-zero-stage2.md
@@ -2,10 +2,9 @@
 layout: single
 title: "An Order-of-Magnitude Larger and Faster Training with ZeRO-2"
 excerpt: ""
-categories: news
+categories: training zero
 new_post: false
 date: 2020-05-19 01:00:00
-tags: training zero
 ---

 ZeRO-2 expands the scope of memory optimizations in the original ZeRO by

diff --git a/docs/_posts/2020-05-28-fastest-bert-training.md b/docs/_posts/2020-05-28-fastest-bert-training.md
index 9abaf96ec354..1eaf6afc4f1b 100644
--- a/docs/_posts/2020-05-28-fastest-bert-training.md
+++ b/docs/_posts/2020-05-28-fastest-bert-training.md
@@ -2,10 +2,9 @@
 layout: single
 title: "Microsoft DeepSpeed achieves the fastest BERT training time"
 excerpt: ""
-categories: news
+categories: training
 new_post: false
 date: 2020-05-28 00:00:00
-tags: training
 ---

 Good news! **DeepSpeed obtains the fastest BERT training record: 44 minutes on

diff --git a/docs/_posts/2020-07-24-deepspeed-webinar.md b/docs/_posts/2020-07-24-deepspeed-webinar.md
index 57e67ba654c6..58f3674845e3 100644
--- a/docs/_posts/2020-07-24-deepspeed-webinar.md
+++ b/docs/_posts/2020-07-24-deepspeed-webinar.md
@@ -2,10 +2,9 @@
 layout: single
 title: "DeepSpeed Microsoft Research Webinar on August 6th, 2020"
 excerpt: ""
-categories: news
+categories: presentations
 link: https://note.microsoft.com/MSR-Webinar-DeepSpeed-Registration-On-Demand.html
 image: /assets/images/webinar-aug2020.png
 new_post: true
 date: 2020-07-24 00:00:00
-tags: presentations
 ---

diff --git a/docs/_posts/2020-08-07-webinar-on-demand.md b/docs/_posts/2020-08-07-webinar-on-demand.md
index 6ee2c77031ed..3173df1f7881 100644
--- a/docs/_posts/2020-08-07-webinar-on-demand.md
+++ b/docs/_posts/2020-08-07-webinar-on-demand.md
@@ -2,9 +2,8 @@
 layout: single
 title: "DeepSpeed Microsoft Research Webinar is now on-demand"
 excerpt: ""
-categories: news
+categories: presentations
 link: https://note.microsoft.com/MSR-Webinar-DeepSpeed-Registration-On-Demand.html
 new_post: true
 date: 2020-08-07 00:00:00
-tags: presentations
 ---

diff --git a/docs/_posts/2020-09-08-sparse-attention-news.md b/docs/_posts/2020-09-08-sparse-attention-news.md
index 2cb1d0007a91..3d5c4cdcb5f9 100644
--- a/docs/_posts/2020-09-08-sparse-attention-news.md
+++ b/docs/_posts/2020-09-08-sparse-attention-news.md
@@ -2,10 +2,9 @@
 layout: single
 title: "Powering 10x longer sequences and 6x faster execution through DeepSpeed Sparse Attention"
 excerpt: ""
-categories: news
+categories: training
 new_post: true
 date: 2020-09-09 00:00:00
-tags: training
 ---

 DeepSpeed offers sparse attention kernels, an instrumental technology to support long sequences of model inputs, whether for text, image, or sound. Compared with the classic dense Transformers, it powers an order-of-magnitude longer input sequence and obtains up to 6x faster execution with comparable accuracy. It also outperforms state-of-the-art sparse implementations with 1.5-3x faster execution. Furthermore, our sparse kernels support efficient execution of flexible sparse format and empower users to innovate on their custom sparse structures.

diff --git a/docs/_posts/2020-09-09-ZeRO-Offload.md b/docs/_posts/2020-09-09-ZeRO-Offload.md
index 6c108d25156a..749683b25ec9 100755
--- a/docs/_posts/2020-09-09-ZeRO-Offload.md
+++ b/docs/_posts/2020-09-09-ZeRO-Offload.md
@@ -2,10 +2,9 @@
 layout: single
 title: "10x bigger model training on a single GPU with ZeRO-Offload"
 excerpt: ""
-categories: news
 new_post: true
 date: 2020-09-09 00:00:00
-tags: training zero
+categories: training zero
 ---

 We introduce a new technology called ZeRO-Offload to enable **10X bigger model training on a single GPU**. ZeRO-Offload extends ZeRO-2 to leverage both CPU and GPU memory for training large models. Using a machine with **a single GPU**, our users now can run **models of up to 13 billion parameters** without running out of memory, 10x bigger than the existing approaches, while obtaining competitive throughput. This feature democratizes multi-billion-parameter model training and opens the window for many deep learning practitioners to explore bigger and better models.
diff --git a/docs/_posts/2020-09-09-onebit-adam-blog-post.md b/docs/_posts/2020-09-09-onebit-adam-blog-post.md
index 6e8836a0e1f3..ffe0f69f317f 100644
--- a/docs/_posts/2020-09-09-onebit-adam-blog-post.md
+++ b/docs/_posts/2020-09-09-onebit-adam-blog-post.md
@@ -2,10 +2,9 @@
 layout: single
 title: "DeepSpeed with 1-bit Adam: 5x less communication and 3.4x faster training"
 excerpt: ""
-categories: news
 new_post: false
 date: 2020-09-09 00:00:00
-tags: training communication
+categories: training communication
 ---

 ## 1. Introduction

diff --git a/docs/_posts/2020-09-09-onebit-adam-news.md b/docs/_posts/2020-09-09-onebit-adam-news.md
index c0ffe748bad2..109631251962 100644
--- a/docs/_posts/2020-09-09-onebit-adam-news.md
+++ b/docs/_posts/2020-09-09-onebit-adam-news.md
@@ -2,10 +2,9 @@
 layout: single
 title: "Up to 5x less communication and 3.4x faster training through 1-bit Adam"
 excerpt: ""
-categories: news
 new_post: true
 date: 2020-09-09 00:00:00
-tags: training communication
+categories: training communication
 ---

diff --git a/docs/_posts/2020-09-09-pipeline-parallelism.md b/docs/_posts/2020-09-09-pipeline-parallelism.md
index 5b588e32f5d6..af537ffcd62c 100644
--- a/docs/_posts/2020-09-09-pipeline-parallelism.md
+++ b/docs/_posts/2020-09-09-pipeline-parallelism.md
@@ -2,10 +2,9 @@
 layout: single
 title: "Training a Trillion Parameters with Pipeline Parallelism"
 excerpt: ""
-categories: news
 new_post: true
 date: 2020-09-09 00:00:00
-tags: training
+categories: training
 ---

 DeepSpeed includes new support for pipeline parallelism! DeepSpeed's training

diff --git a/docs/_posts/2020-09-09-sparse-attention.md b/docs/_posts/2020-09-09-sparse-attention.md
index 2dc0c368df82..40fdfb449ef1 100644
--- a/docs/_posts/2020-09-09-sparse-attention.md
+++ b/docs/_posts/2020-09-09-sparse-attention.md
@@ -2,10 +2,9 @@
 layout: single
 title: "DeepSpeed Sparse Attention"
 excerpt: ""
-categories: news
 new_post: true
 date: 2020-09-09 01:00:00
-tags: training inference
+categories: training inference
 ---

 Attention-based deep learning models such as the transformers are highly effective in capturing relationship between tokens in an input sequence, even across long distances. As a result, they are used with text, image, and sound-based inputs, where the sequence length can be in thousands of tokens. However, despite the effectiveness of attention modules to capture long term dependencies, in practice, their application to long sequence input is limited by compute and memory requirements of the attention computation that grow quadratically, `O(n^2)`, with the sequence length `n`.

diff --git a/docs/_posts/2020-10-28-progressive-layer-dropping-news.md b/docs/_posts/2020-10-28-progressive-layer-dropping-news.md
index 3e06f2dfe72c..53a995da93b6 100755
--- a/docs/_posts/2020-10-28-progressive-layer-dropping-news.md
+++ b/docs/_posts/2020-10-28-progressive-layer-dropping-news.md
@@ -2,10 +2,9 @@
 layout: single
 title: "Progressive Layer Dropping"
 excerpt: ""
-categories: news
 new_post: true
 date: 2020-10-29 00:00:00
-tags: training
+categories: training
 ---

 We introduce a new technology called progressive layer dropping (PLD) to speedup the pre-training of Transformer-based networks through efficient and robust compressed training. The pre-training step of Transformer networks often suffer from unbearable overall computational expenses. We analyze the training dynamics and stability of Transformer networks and propose PLD to sparsely update Transformer blocks following a progressive dropping schedule, which smoothly increases the layer dropping rate for each mini-batch as training evolves along both the temporal and the model depth dimension. PLD is able to allow the pre-training to be **2.5X faster** to get similar accuracy on downstream tasks and allows the training to be **24% faster** when training the same number of samples, not at the cost of excessive hardware resources.

diff --git a/docs/_posts/2021-03-08-zero3-offload.md b/docs/_posts/2021-03-08-zero3-offload.md
index e9c8cd470eff..ea394e46fc37 100644
--- a/docs/_posts/2021-03-08-zero3-offload.md
+++ b/docs/_posts/2021-03-08-zero3-offload.md
@@ -2,10 +2,9 @@
 layout: single
 title: "DeepSpeed ZeRO-3 Offload"
 excerpt: ""
-categories: news
 new_post: true
 date: 2021-03-08 00:00:00
-tags: training zero
+categories: training zero
 ---

 Today we are announcing the release of ZeRO-3 Offload, a highly efficient and easy to use implementation of ZeRO Stage 3 and ZeRO Offload combined, geared towards our continued goal of democratizing AI by making efficient large-scale DL training available to everyone. The key benefits of ZeRO-3 Offload are:

diff --git a/docs/_posts/2021-05-05-MoQ.md b/docs/_posts/2021-05-05-MoQ.md
index a9582c652ab4..8e2255293dbe 100644
--- a/docs/_posts/2021-05-05-MoQ.md
+++ b/docs/_posts/2021-05-05-MoQ.md
@@ -2,10 +2,9 @@
 layout: single
 title: "Mixture-of-Quantization: A novel quantization approach for reducing model size with minimal accuracy impact"
 excerpt: ""
-categories: news
 new_post: false
 date: 2021-05-05 00:00:00
-tags: inference
+categories: inference
 ---

 ## A unified suite for quantization-aware training and inference

diff --git a/docs/_posts/2021-05-05-inference-kernel-optimization.md b/docs/_posts/2021-05-05-inference-kernel-optimization.md
index 218387c07f55..933e00fa7449 100644
--- a/docs/_posts/2021-05-05-inference-kernel-optimization.md
+++ b/docs/_posts/2021-05-05-inference-kernel-optimization.md
@@ -2,10 +2,9 @@
 layout: single
 title: "DeepSpeed Inference: Multi-GPU inference with customized inference kernels and quantization support"
 excerpt: ""
-categories: news
 new_post: false
 date: 2021-03-16 00:00:00
-tags: inference
+categories: inference
 ---

 While DeepSpeed supports training advanced large-scale models, using these trained models in the desired application scenarios is still challenging due to three major limitations in existing inference solutions: 1) lack of support for multi-GPU inference to fit large models and meet latency requirements, 2) limited GPU kernel performance when running inference with small batch sizes, and 3) difficulties in exploiting quantization, which includes both quantizing the model to reduce the model size and latency as well as supporting high-performance inference of quantized models without specialized hardware.

diff --git a/docs/_posts/2021-05-14-inference-release.md b/docs/_posts/2021-05-14-inference-release.md
index 658627e7115f..2f6755d3679d 100644
--- a/docs/_posts/2021-05-14-inference-release.md
+++ b/docs/_posts/2021-05-14-inference-release.md
@@ -4,6 +4,5 @@ title: "DeepSpeed: Accelerating large-scale model inference and training via sys
 date: 2021-05-14
 link: https://www.microsoft.com/en-us/research/blog/deepspeed-accelerating-large-scale-model-inference-and-training-via-system-optimizations-and-compression/
 excerpt: "Developed by Microsoft AI & Research."
-categories: news
-tags: inference
+categories: inference
 ---

diff --git a/docs/_posts/2021-08-18-deepspeed-moe.md b/docs/_posts/2021-08-18-deepspeed-moe.md
index 0cc61f52d0fc..86e27ff2edb7 100644
--- a/docs/_posts/2021-08-18-deepspeed-moe.md
+++ b/docs/_posts/2021-08-18-deepspeed-moe.md
@@ -2,9 +2,8 @@
 layout: single
 title: "DeepSpeed powers 8x larger MoE model training with high performance"
 excerpt: ""
-categories: news
 link: https://www.microsoft.com/en-us/research/blog/deepspeed-powers-8x-larger-moe-model-training-with-high-performance/
 new_post: true
 date: 2021-08-18 00:00:00
-tags: training
+categories: training
 ---

diff --git a/docs/_posts/2021-11-15-autotuning.md b/docs/_posts/2021-11-15-autotuning.md
index 00ea4f1aa27b..509f691e57f1 100644
--- a/docs/_posts/2021-11-15-autotuning.md
+++ b/docs/_posts/2021-11-15-autotuning.md
@@ -2,10 +2,9 @@
 layout: single
 title: "Autotuning: Automatically discover the optimal DeepSpeed configuration that delivers good training speed"
 excerpt: ""
-categories: news
 new_post: true
 date: 2021-11-16 00:00:00
-tags: training
+categories: training
 ---

 We introduce a new feature called Autotuning to automatically discover the optimal DeepSpeed configuration that delivers good training speed. One pain point in model training is to figure out good performance-relevant configurations such as micro-batch size to fully utilize the hardware and achieve a high throughput number. This configuration exploring process is commonly done manually but is important since model training is repeated many times and benefits from using a good configuration. Not only is the hand-tuning process time-consuming, but the outcome is hardware-dependent. This means that a good configuration on one hardware might not be the best on another different hardware. The user thus has to hand tune the configuration again. With DeepSpeed, there are more configuration parameters that could potentially affect the training speed, thus making it more tedious to manually tune the configuration.
diff --git a/docs/_posts/2021-12-09-deepspeed-moe-nlg.md b/docs/_posts/2021-12-09-deepspeed-moe-nlg.md
index ea92b791c449..2e2b19c9cc2e 100644
--- a/docs/_posts/2021-12-09-deepspeed-moe-nlg.md
+++ b/docs/_posts/2021-12-09-deepspeed-moe-nlg.md
@@ -2,10 +2,9 @@
 layout: single
 title: "DeepSpeed-MoE for NLG: Reducing the training cost of language models by 5 times"
 excerpt: ""
-categories: news
 new_post: false
 date: 2021-12-09 22:00:00
-tags: training
+categories: training
 ---

 Published on December 9, 2021

diff --git a/docs/_posts/2022-01-19-moe-inference.md b/docs/_posts/2022-01-19-moe-inference.md
index 1554f7bc5fc0..3cfab04b96cc 100644
--- a/docs/_posts/2022-01-19-moe-inference.md
+++ b/docs/_posts/2022-01-19-moe-inference.md
@@ -2,9 +2,8 @@
 layout: single
 title: "DeepSpeed: Advancing MoE inference and training to power next-generation AI scale"
 excerpt: ""
-categories: news
 link: https://www.microsoft.com/en-us/research/blog/deepspeed-advancing-moe-inference-and-training-to-power-next-generation-ai-scale/
 new_post: true
 date: 2022-01-19 00:00:00
-tags: inference
+categories: inference
 ---

diff --git a/docs/news/index.html b/docs/news/index.html
index 95e7974b5050..6cfe0b7a14c1 100644
--- a/docs/news/index.html
+++ b/docs/news/index.html
@@ -1,3 +1,3 @@
 ---
-layout: news-home
+layout: news
 ---

From 234d7c2bf147053cb1af96438796cb2bfec4542c Mon Sep 17 00:00:00 2001
From: Cheng Li
Date: Sat, 26 Feb 2022 14:02:25 +0500
Subject: [PATCH 04/20] refactor posts layout and presentation

---
 docs/_config.yml                                |   9 +-
 docs/_data/navigation.yml                       |   2 +-
 docs/_includes/analytics.html                   |  14 +
 docs/_includes/archive-single.html              |  30 +++
 .../author-profile-custom-links.html            |   7 +
 docs/_includes/author-profile.html              | 252 ++++++++++++++++++
 docs/_includes/breadcrumbs.html                 |  39 +++
 docs/_includes/browser-upgrade.html             |   3 +
 docs/_includes/category-list.html               |  26 ++
 docs/_includes/comment.html                     |  22 ++
 docs/_includes/comments.html                    | 159 +++++++++++
 docs/_includes/documents-collection.html        |  21 ++
 docs/_includes/feature_row                      |  41 +++
 docs/_includes/figure                           |   9 +
 docs/_includes/footer.html                      |  19 ++
 docs/_includes/gallery                          |  35 +++
 docs/_includes/group-by-array                   |  47 ++++
 docs/_includes/head.html                        |  37 +++
 docs/_includes/masthead.html                    |  37 +++
 docs/_includes/nav_list                         |  26 ++
 docs/_includes/page__date.html                  |   5 +
 docs/_includes/page__hero.html                  |  51 ++++
 docs/_includes/page__hero_video.html            |   2 +
 docs/_includes/page__meta.html                  |  30 +++
 docs/_includes/page__taxonomy.html              |   7 +
 docs/_includes/paginator.html                   |  69 +++++
 docs/_includes/post_pagination.html             |  14 +
 docs/_includes/posts-category.html              |   5 +
 docs/_includes/posts-tag.html                   |   5 +
 docs/_includes/scripts.html                     |  28 ++
 docs/_includes/seo.html                         | 155 +++++++++++
 docs/_includes/sidebar.html                     |  19 ++
 docs/_includes/skip-links.html                  |   8 +
 docs/_includes/social-share.html                |  11 +
 docs/_includes/tag-list.html                    |  26 ++
 docs/_includes/toc                              |   7 +
 docs/_includes/toc.html                         |  96 +++++++
 docs/_includes/video                            |  24 ++
 docs/_layouts/feed.html                         |  22 --
 docs/_layouts/news-home.html                    |  67 -----
 docs/_layouts/single-full.html                  |  82 ++++++
 docs/_layouts/tags.html                         |  16 --
 docs/_posts/2020-02-13-release.md               |   3 +-
 docs/_posts/2020-02-13-turing-nlg.md            |   3 +-
 docs/_posts/2020-05-19-bert-record.md           |   4 +-
 docs/_posts/2020-05-19-press-release.md         |   4 +-
 docs/_posts/2020-05-19-zero-stage2.md           |   4 +-
 .../2020-05-28-fastest-bert-training.md         |   4 +-
 docs/_posts/2020-07-24-deepspeed-webinar.md     |   4 +-
 docs/_posts/2020-08-07-webinar-on-demand.md     |   4 +-
 .../2020-09-08-sparse-attention-news.md         |   4 +-
 docs/_posts/2020-09-09-ZeRO-Offload.md         |   4 +-
 .../2020-09-09-onebit-adam-blog-post.md         |   4 +-
 docs/_posts/2020-09-09-onebit-adam-news.md      |   4 +-
 .../_posts/2020-09-09-pipeline-parallelism.md   |   4 +-
 docs/_posts/2020-09-09-sparse-attention.md      |   4 +-
 ...0-10-28-progressive-layer-dropping-news.md   |   4 +-
 docs/_posts/2021-03-08-zero3-offload.md         |   4 +-
 docs/_posts/2021-05-05-MoQ.md                   |   4 +-
 ...021-05-05-inference-kernel-optimization.md   |   4 +-
 docs/_posts/2021-05-14-inference-release.md     |   3 +-
 docs/_posts/2021-08-18-deepspeed-moe.md         |   4 +-
 docs/_posts/2021-11-15-autotuning.md            |   6 +-
 docs/_posts/2021-12-09-deepspeed-moe-nlg.md     |   6 +-
 docs/_posts/2022-01-19-moe-inference.md         |   4 +-
 docs/_sass/minimal-mistakes.scss                |  65 +++++
 docs/assets/css/main.scss                       |  64 +++++
 docs/news/index.html                            |   3 -
 docs/{_layouts/news.html => tags.md}            |  30 ++-
 docs/tags_list.md                               |  29 ++
 70 files changed, 1675 insertions(+), 193 deletions(-)
 create mode 100644 docs/_includes/analytics.html
 create mode 100644 docs/_includes/archive-single.html
 create mode 100644 docs/_includes/author-profile-custom-links.html
 create mode 100644 docs/_includes/author-profile.html
 create mode 100644 docs/_includes/breadcrumbs.html
 create mode 100644 docs/_includes/browser-upgrade.html
 create mode 100644 docs/_includes/category-list.html
 create mode 100644 docs/_includes/comment.html
 create mode 100644 docs/_includes/comments.html
 create mode 100644 docs/_includes/documents-collection.html
 create mode 100644 docs/_includes/feature_row
 create mode 100644 docs/_includes/figure
 create mode 100644 docs/_includes/footer.html
 create mode 100644 docs/_includes/gallery
 create mode 100644 docs/_includes/group-by-array
 create mode 100644 docs/_includes/head.html
 create mode 100644 docs/_includes/masthead.html
 create mode 100644 docs/_includes/nav_list
 create mode 100644 docs/_includes/page__date.html
 create mode 100644 docs/_includes/page__hero.html
 create mode 100644 docs/_includes/page__hero_video.html
 create mode 100644 docs/_includes/page__meta.html
 create mode 100644 docs/_includes/page__taxonomy.html
 create mode 100644 docs/_includes/paginator.html
 create mode 100644 docs/_includes/post_pagination.html
 create mode 100644 docs/_includes/posts-category.html
 create mode 100644 docs/_includes/posts-tag.html
 create mode 100644 docs/_includes/scripts.html
 create mode 100644 docs/_includes/seo.html
 create mode 100644 docs/_includes/sidebar.html
 create mode 100644 docs/_includes/skip-links.html
 create mode 100644 docs/_includes/social-share.html
 create mode 100644 docs/_includes/tag-list.html
 create mode 100644 docs/_includes/toc
 create mode 100644 docs/_includes/toc.html
 create mode 100644 docs/_includes/video
 delete mode 100644 docs/_layouts/feed.html
 delete mode 100644 docs/_layouts/news-home.html
 create mode 100644 docs/_layouts/single-full.html
 delete mode 100644 docs/_layouts/tags.html
 create mode 100644 docs/_sass/minimal-mistakes.scss
 delete mode 100644 docs/news/index.html
 rename docs/{_layouts/news.html => tags.md} (63%)
 create mode 100644 docs/tags_list.md

diff --git a/docs/_config.yml b/docs/_config.yml
index 87cc953255fe..e5642cbfcded 100644
--- a/docs/_config.yml
+++ b/docs/_config.yml
@@ -78,8 +78,15 @@ defaults:
       path: ""
       type: posts
     values:
-      layout: single
+      layout: single-full
+      classes: wide2
+      author_profile: false
+      read_time: false
+      comments: false
       share: true
+      related: false
+      toc: false
+      show_date: true

 analytics:
   provider: "google-gtag"
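Editor's note: these `_config.yml` defaults apply to every file under `_posts`, so each post now gets the `single-full` layout and `wide2` class without declaring them, and the later hunks in this patch can drop the per-post keys. Any post can still override a default in its own front matter; a hypothetical example:

```yaml
---
layout: single   # override the single-full default for this post only
toc: true        # re-enable a feature the site-wide defaults turn off
---
```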
diff --git a/docs/_data/navigation.yml b/docs/_data/navigation.yml
index 00a3184b5b2e..9fa5e12b4d79 100755
--- a/docs/_data/navigation.yml
+++ b/docs/_data/navigation.yml
@@ -2,7 +2,7 @@ main:
   - title: 'Getting Started'
     url: /getting-started/
   - title: 'Blog'
-    url: /news/
+    url: /posts/
   - title: 'Tutorials'
     url: /tutorials/
   - title: 'Documentation'

diff --git a/docs/_includes/analytics.html b/docs/_includes/analytics.html
new file mode 100644
index 000000000000..371469f0af9b
--- /dev/null
+++ b/docs/_includes/analytics.html
@@ -0,0 +1,14 @@
+{% if jekyll.environment == 'production' and site.analytics.provider and page.analytics != false %}
+
+{% case site.analytics.provider %}
+{% when "google" %}
+  {% include /analytics-providers/google.html %}
+{% when "google-universal" %}
+  {% include /analytics-providers/google-universal.html %}
+{% when "google-gtag" %}
+  {% include /analytics-providers/google-gtag.html %}
+{% when "custom" %}
+  {% include /analytics-providers/custom.html %}
+{% endcase %}
+
+{% endif %}
\ No newline at end of file

diff --git a/docs/_includes/archive-single.html b/docs/_includes/archive-single.html
new file mode 100644
index 000000000000..68174807ef50
--- /dev/null
+++ b/docs/_includes/archive-single.html
@@ -0,0 +1,30 @@
+{% if post.header.teaser %}
+  {% capture teaser %}{{ post.header.teaser }}{% endcapture %}
+{% else %}
+  {% assign teaser = site.teaser %}
+{% endif %}
+
+{% if post.id %}
+  {% assign title = post.title | markdownify | remove: "<p>" | remove: "</p>" %}
+{% else %}
+  {% assign title = post.title %}
+{% endif %}
+
+
+ {% if include.type == "grid" and teaser %} +
+ +
+ {% endif %} +

+ {% if post.link %} + {{ title }} Permalink + {% else %} + {{ title }} + {% endif %} +

+ {% include page__meta.html type=include.type %} + {% if post.excerpt %}

{{ post.excerpt | markdownify | strip_html | truncate: 160 }}

{% endif %} +
+
diff --git a/docs/_includes/author-profile-custom-links.html b/docs/_includes/author-profile-custom-links.html new file mode 100644 index 000000000000..b89ffcb7df6c --- /dev/null +++ b/docs/_includes/author-profile-custom-links.html @@ -0,0 +1,7 @@ + \ No newline at end of file diff --git a/docs/_includes/author-profile.html b/docs/_includes/author-profile.html new file mode 100644 index 000000000000..d384ee734376 --- /dev/null +++ b/docs/_includes/author-profile.html @@ -0,0 +1,252 @@ +{% assign author = page.author | default: page.authors[0] | default: site.author %} +{% assign author = site.data.authors[author] | default: author %} + +
+ + {% if author.avatar %} +
+ {% if author.home %} + + {{ author.name }} + + {% else %} + {{ author.name }} + {% endif %} +
+ {% endif %} + +
+ {% if author.home %} +

{{ author.name }}

+ {% else %} +

{{ author.name }}

+ {% endif %} + {% if author.bio %} +
+ {{ author.bio | markdownify }} +
+ {% endif %} +
+ +
+ + +
+
diff --git a/docs/_includes/breadcrumbs.html b/docs/_includes/breadcrumbs.html new file mode 100644 index 000000000000..cba3d415fa4f --- /dev/null +++ b/docs/_includes/breadcrumbs.html @@ -0,0 +1,39 @@ +{% case site.category_archive.type %} + {% when "liquid" %} + {% assign path_type = "#" %} + {% when "jekyll-archives" %} + {% assign path_type = nil %} +{% endcase %} + +{% if page.collection != 'posts' %} + {% assign path_type = nil %} + {% assign crumb_path = '/' %} +{% else %} + {% assign crumb_path = site.category_archive.path %} +{% endif %} + + diff --git a/docs/_includes/browser-upgrade.html b/docs/_includes/browser-upgrade.html new file mode 100644 index 000000000000..ec6ad0acc566 --- /dev/null +++ b/docs/_includes/browser-upgrade.html @@ -0,0 +1,3 @@ + diff --git a/docs/_includes/category-list.html b/docs/_includes/category-list.html new file mode 100644 index 000000000000..d684a2829f3b --- /dev/null +++ b/docs/_includes/category-list.html @@ -0,0 +1,26 @@ +{% case site.category_archive.type %} + {% when "liquid" %} + {% assign path_type = "#" %} + {% when "jekyll-archives" %} + {% assign path_type = nil %} +{% endcase %} + +{% if site.category_archive.path %} + {% comment %} + + + {% endcomment %} + {% capture page_categories %}{% for category in page.categories %}{{ category | downcase }}|{{ category }}{% unless forloop.last %},{% endunless %}{% endfor %}{% endcapture %} + {% assign category_hashes = page_categories | split: ',' | sort %} + +

+ {{ site.data.ui-text[site.locale].categories_label | default: "Categories:" }} + + {% for hash in category_hashes %} + {% assign keyValue = hash | split: '|' %} + {% capture category_word %}{{ keyValue[1] | strip_newlines }}{% endcapture %} + {% unless forloop.last %}, {% endunless %} + {% endfor %} + +

+{% endif %} \ No newline at end of file diff --git a/docs/_includes/comment.html b/docs/_includes/comment.html new file mode 100644 index 000000000000..2e3013ee2a76 --- /dev/null +++ b/docs/_includes/comment.html @@ -0,0 +1,22 @@ + diff --git a/docs/_includes/comments.html b/docs/_includes/comments.html new file mode 100644 index 000000000000..dbb90d1e3a0f --- /dev/null +++ b/docs/_includes/comments.html @@ -0,0 +1,159 @@ +
+ {% capture comments_label %}{{ site.data.ui-text[site.locale].comments_label | default: "Comments" }}{% endcapture %} + {% case site.comments.provider %} + {% when "discourse" %} +

{{ comments_label }}

+
+ {% when "disqus" %} +

{{ comments_label }}

+
+ {% when "facebook" %} +

{{ comments_label }}

+
+ {% when "staticman_v2" %} +
+ {% if site.repository and site.comments.staticman.branch %} + +
+ {% if site.data.comments[page.slug] %} +

{{ site.data.ui-text[site.locale].comments_title | default: "Comments" }}

+ {% assign comments = site.data.comments[page.slug] | sort %} + + {% for comment in comments %} + {% assign email = comment[1].email %} + {% assign name = comment[1].name %} + {% assign url = comment[1].url %} + {% assign date = comment[1].date %} + {% assign message = comment[1].message %} + {% include comment.html index=forloop.index email=email name=name url=url date=date message=message %} + {% endfor %} + {% endif %} +
+ + + +
+

{{ site.data.ui-text[site.locale].comments_label | default: "Leave a Comment" }}

+

{{ site.data.ui-text[site.locale].comment_form_info | default: "Your email address will not be published. Required fields are marked" }} *

+
+
+ + {{ site.data.ui-text[site.locale].loading_label | default: "Loading..." }} +
+ +
+ + + +
+
+ + +
+
+ + +
+
+ + +
+ + + + + {% if site.reCaptcha.siteKey %} +
+
+
+ {% endif %} +
+ +
+
+
+ + {% if site.reCaptcha.siteKey %}{% endif %} + {% endif %} +
+ {% when "staticman" %} +
+ {% if site.repository and site.staticman.branch %} + +
+ {% if site.data.comments[page.slug] %} +

{{ site.data.ui-text[site.locale].comments_title | default: "Comments" }}

+ {% assign comments = site.data.comments[page.slug] | sort %} + + {% for comment in comments %} + {% assign email = comment[1].email %} + {% assign name = comment[1].name %} + {% assign url = comment[1].url %} + {% assign date = comment[1].date %} + {% assign message = comment[1].message %} + {% include comment.html index=forloop.index email=email name=name url=url date=date message=message %} + {% endfor %} + {% endif %} +
+ + + +
+

{{ site.data.ui-text[site.locale].comments_label | default: "Leave a Comment" }}

+

{{ site.data.ui-text[site.locale].comment_form_info | default: "Your email address will not be published. Required fields are marked" }} *

+
+
+ + {{ site.data.ui-text[site.locale].loading_label | default: "Loading..." }} +
+ +
+ + + +
+
+ + +
+
+ + +
+
+ + +
+ + + + +
+ +
+
+
+ + {% endif %} +
+ {% when "utterances" %} +

{{ comments_label }}

+
+ {% when "custom" %} + {% include /comments-providers/custom.html %} + {% endcase %} +
diff --git a/docs/_includes/documents-collection.html b/docs/_includes/documents-collection.html new file mode 100644 index 000000000000..376a509e3e49 --- /dev/null +++ b/docs/_includes/documents-collection.html @@ -0,0 +1,21 @@ +{% assign entries = site[include.collection] %} + +{% if include.sort_by == 'title' %} + {% if include.sort_order == 'reverse' %} + {% assign entries = entries | sort: 'title' | reverse %} + {% else %} + {% assign entries = entries | sort: 'title' %} + {% endif %} +{% elsif include.sort_by == 'date' %} + {% if include.sort_order == 'reverse' %} + {% assign entries = entries | sort: 'date' | reverse %} + {% else %} + {% assign entries = entries | sort: 'date' %} + {% endif %} +{% endif %} + +{%- for post in entries -%} + {%- unless post.hidden -%} + {% include archive-single.html %} + {%- endunless -%} +{%- endfor -%} diff --git a/docs/_includes/feature_row b/docs/_includes/feature_row new file mode 100644 index 000000000000..03f09c15cf0c --- /dev/null +++ b/docs/_includes/feature_row @@ -0,0 +1,41 @@ +{% if include.id %} + {% assign feature_row = page[include.id] %} +{% else %} + {% assign feature_row = page.feature_row %} +{% endif %} + +
+ + {% for f in feature_row %} +
+
+ {% if f.image_path %} +
+ {% if f.alt %}{{ f.alt }}{% endif %} + {% if f.image_caption %} + {{ f.image_caption | markdownify | remove: "

" | remove: "

" }}
+ {% endif %} +
+ {% endif %} + +
+ {% if f.title %} +

{{ f.title }}

+ {% endif %} + + {% if f.excerpt %} +
+ {{ f.excerpt | markdownify }} +
+ {% endif %} + + {% if f.url %} +

{{ f.btn_label | default: site.data.ui-text[site.locale].more_label | default: "Learn More" }}

+ {% endif %} +
+
+
+ {% endfor %} + +
diff --git a/docs/_includes/figure b/docs/_includes/figure new file mode 100644 index 000000000000..f1ce1ebcc110 --- /dev/null +++ b/docs/_includes/figure @@ -0,0 +1,9 @@ +
+ {% if include.alt %}{{ include.alt }}{% endif %} + {% if include.caption %} +
+ {{ include.caption | markdownify | remove: "

" | remove: "

" }} +
+ {% endif %} +
diff --git a/docs/_includes/footer.html b/docs/_includes/footer.html new file mode 100644 index 000000000000..2bc78963ce39 --- /dev/null +++ b/docs/_includes/footer.html @@ -0,0 +1,19 @@ + + + diff --git a/docs/_includes/gallery b/docs/_includes/gallery new file mode 100644 index 000000000000..71a9e1e1b3d1 --- /dev/null +++ b/docs/_includes/gallery @@ -0,0 +1,35 @@ +{% if include.id %} + {% assign gallery = page[include.id] %} +{% else %} + {% assign gallery = page.gallery %} +{% endif %} + +{% if include.layout %} + {% assign gallery_layout = include.layout %} +{% else %} + {% if gallery.size == 2 %} + {% assign gallery_layout = 'half' %} + {% elsif gallery.size >= 3 %} + {% assign gallery_layout = 'third' %} + {% else %} + {% assign gallery_layout = '' %} + {% endif %} +{% endif %} + + diff --git a/docs/_includes/group-by-array b/docs/_includes/group-by-array new file mode 100644 index 000000000000..708de41ae3f8 --- /dev/null +++ b/docs/_includes/group-by-array @@ -0,0 +1,47 @@ + + + +{% assign __empty_array = '' | split: ',' %} +{% assign group_names = __empty_array %} +{% assign group_items = __empty_array %} + + +{% assign __names = include.collection | map: include.field %} + + +{% assign __names = __names | join: ',' | join: ',' | split: ',' %} + + +{% assign __names = __names | sort %} +{% for name in __names %} + + +{% unless name == previous %} + + +{% assign group_names = group_names | push: name %} +{% endunless %} + +{% assign previous = name %} +{% endfor %} + + + +{% for name in group_names %} + + +{% assign __item = __empty_array %} +{% for __element in include.collection %} +{% if __element[include.field] contains name %} +{% assign __item = __item | push: __element %} +{% endif %} +{% endfor %} + + +{% assign group_items = group_items | push: __item %} +{% endfor %} \ No newline at end of file diff --git a/docs/_includes/head.html b/docs/_includes/head.html new file mode 100644 index 000000000000..3b99471f5ec5 --- /dev/null +++ b/docs/_includes/head.html @@ -0,0 +1,37 @@ + + +{% include seo.html %} + + + + + + + + + + + + + + +{% if site.head_scripts %} + {% for script in site.head_scripts %} + + {% endfor %} +{% endif %} diff --git a/docs/_includes/masthead.html b/docs/_includes/masthead.html new file mode 100644 index 000000000000..47cce0a3545e --- /dev/null +++ b/docs/_includes/masthead.html @@ -0,0 +1,37 @@ +{% capture logo_path %}{{ site.logo }}{% endcapture %} + +
+
+
+ +
+
+
diff --git a/docs/_includes/nav_list b/docs/_includes/nav_list new file mode 100644 index 000000000000..a035a5bd7b15 --- /dev/null +++ b/docs/_includes/nav_list @@ -0,0 +1,26 @@ +{% assign navigation = site.data.navigation[include.nav] %} + + diff --git a/docs/_includes/page__date.html b/docs/_includes/page__date.html new file mode 100644 index 000000000000..e663f9b9c7f0 --- /dev/null +++ b/docs/_includes/page__date.html @@ -0,0 +1,5 @@ +{% if page.last_modified_at %} +

{{ site.data.ui-text[site.locale].date_label | default: "Updated:" }}

+{% elsif page.date %} +

{{ site.data.ui-text[site.locale].date_label | default: "Updated:" }}

+{% endif %} diff --git a/docs/_includes/page__hero.html b/docs/_includes/page__hero.html new file mode 100644 index 000000000000..3f55aaa60ac5 --- /dev/null +++ b/docs/_includes/page__hero.html @@ -0,0 +1,51 @@ +{% capture overlay_img_path %}{{ page.header.overlay_image | relative_url }}{% endcapture %} + +{% if page.header.overlay_filter contains "rgba" %} + {% capture overlay_filter %}{{ page.header.overlay_filter }}{% endcapture %} +{% elsif page.header.overlay_filter %} + {% capture overlay_filter %}rgba(0, 0, 0, {{ page.header.overlay_filter }}){% endcapture %} +{% endif %} + +{% if page.header.image_description %} + {% assign image_description = page.header.image_description %} +{% else %} + {% assign image_description = page.title %} +{% endif %} + +{% assign image_description = image_description | markdownify | strip_html | strip_newlines | escape_once %} + +
+ {% if page.header.overlay_color or page.header.overlay_image %} +
+

+ {% if paginator and site.paginate_show_page_num %} + {{ site.title }}{% unless paginator.page == 1 %} {{ site.data.ui-text[site.locale].page | default: "Page" }} {{ paginator.page }}{% endunless %} + {% else %} + {{ page.title | default: site.title | markdownify | remove: "

" | remove: "

" }} + {% endif %} +

+ {% if page.tagline %} +

{{ page.tagline | markdownify | remove: "

" | remove: "

" }}

+ {% elsif page.header.show_overlay_excerpt != false and page.excerpt %} +

{{ page.excerpt | markdownify | remove: "

" | remove: "

" }}

+ {% endif %} + {% include page__meta.html %} + {% if page.header.cta_url %} +

{{ page.header.cta_label | default: site.data.ui-text[site.locale].more_label | default: "Learn More" }}

+ {% endif %} + {% if page.header.actions %} +

+ {% for action in page.header.actions %} + {{ action.label | default: site.data.ui-text[site.locale].more_label | default: "Learn More" }} + {% endfor %} + {% endif %} +

+ {% else %} + {{ image_description }} + {% endif %} + {% if page.header.caption %} + {{ page.header.caption | markdownify | remove: "

" | remove: "

" }}
+ {% endif %} +
diff --git a/docs/_includes/page__hero_video.html b/docs/_includes/page__hero_video.html new file mode 100644 index 000000000000..a313a23d45b9 --- /dev/null +++ b/docs/_includes/page__hero_video.html @@ -0,0 +1,2 @@ +{% assign video = page.header.video %} +{% include video id=video.id provider=video.provider danmaku=video.danmaku %} diff --git a/docs/_includes/page__meta.html b/docs/_includes/page__meta.html new file mode 100644 index 000000000000..1afc3d8f85eb --- /dev/null +++ b/docs/_includes/page__meta.html @@ -0,0 +1,30 @@ +{% assign document = post | default: page %} +{% if document.read_time or document.show_date %} +

+ {% if document.show_date and document.date %} + {% assign date = document.date %} + + + + + {% endif %} + + {% if document.read_time and document.show_date %}{% endif %} + + {% if document.read_time %} + {% assign words_per_minute = document.words_per_minute | default: site.words_per_minute | default: 200 %} + {% assign words = document.content | strip_html | number_of_words %} + + + + {% if words < words_per_minute %} + {{ site.data.ui-text[site.locale].less_than | default: "less than" }} 1 {{ site.data.ui-text[site.locale].minute_read | default: "minute read" }} + {% elsif words == words_per_minute %} + 1 {{ site.data.ui-text[site.locale].minute_read | default: "minute read" }} + {% else %} + {{ words | divided_by: words_per_minute }} {{ site.data.ui-text[site.locale].minute_read | default: "minute read" }} + {% endif %} + + {% endif %} +
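+  {% comment %}
+    Worked example of the read-time arithmetic above: with the default
+    words_per_minute of 200, a 1,100-word post computes 1100 / 200 = 5
+    under integer division and renders as "5 minute read"; a post under
+    200 words renders as "less than 1 minute read".
+  {% endcomment %}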

+{% endif %} diff --git a/docs/_includes/page__taxonomy.html b/docs/_includes/page__taxonomy.html new file mode 100644 index 000000000000..75c76c81ddf2 --- /dev/null +++ b/docs/_includes/page__taxonomy.html @@ -0,0 +1,7 @@ +{% if site.tag_archive.type and page.tags[0] %} + {% include tag-list.html %} +{% endif %} + +{% if site.category_archive.type and page.categories[0] %} + {% include category-list.html %} +{% endif %} \ No newline at end of file diff --git a/docs/_includes/paginator.html b/docs/_includes/paginator.html new file mode 100644 index 000000000000..bffa0794678e --- /dev/null +++ b/docs/_includes/paginator.html @@ -0,0 +1,69 @@ +{% if paginator.total_pages > 1 %} + +{% endif %} diff --git a/docs/_includes/post_pagination.html b/docs/_includes/post_pagination.html new file mode 100644 index 000000000000..a93c6279763b --- /dev/null +++ b/docs/_includes/post_pagination.html @@ -0,0 +1,14 @@ +{% if page.previous or page.next %} + +{% endif %} \ No newline at end of file diff --git a/docs/_includes/posts-category.html b/docs/_includes/posts-category.html new file mode 100644 index 000000000000..b364f30e94e5 --- /dev/null +++ b/docs/_includes/posts-category.html @@ -0,0 +1,5 @@ +{%- for post in site.categories[include.taxonomy] -%} + {%- unless post.hidden -%} + {% include archive-single.html %} + {%- endunless -%} +{%- endfor -%} diff --git a/docs/_includes/posts-tag.html b/docs/_includes/posts-tag.html new file mode 100644 index 000000000000..46fade02a01f --- /dev/null +++ b/docs/_includes/posts-tag.html @@ -0,0 +1,5 @@ +{%- for post in site.tags[include.taxonomy] -%} + {%- unless post.hidden -%} + {% include archive-single.html %} + {%- endunless -%} +{%- endfor -%} diff --git a/docs/_includes/scripts.html b/docs/_includes/scripts.html new file mode 100644 index 000000000000..bbdaddff0bab --- /dev/null +++ b/docs/_includes/scripts.html @@ -0,0 +1,28 @@ +{% if site.footer_scripts %} + {% for script in site.footer_scripts %} + + {% endfor %} +{% else %} + +{% endif %} + +{% if site.search == true or page.layout == "search" %} + {%- assign search_provider = site.search_provider | default: "lunr" -%} + {%- case search_provider -%} + {%- when "lunr" -%} + {% include_cached search/lunr-search-scripts.html %} + {%- when "google" -%} + {% include_cached search/google-search-scripts.html %} + {%- when "algolia" -%} + {% include_cached search/algolia-search-scripts.html %} + {%- endcase -%} +{% endif %} + +{% include analytics.html %} +{% include /comments-providers/scripts.html %} + +{% if site.after_footer_scripts %} + {% for script in site.after_footer_scripts %} + + {% endfor %} +{% endif %} diff --git a/docs/_includes/seo.html b/docs/_includes/seo.html new file mode 100644 index 000000000000..7df1253b7f85 --- /dev/null +++ b/docs/_includes/seo.html @@ -0,0 +1,155 @@ + +{%- if site.url -%} + {%- assign seo_url = site.url | append: site.baseurl -%} +{%- endif -%} +{%- assign seo_url = seo_url | default: site.github.url -%} + +{% assign title_separator = site.title_separator | default: '-' | replace: '|', '|' %} + +{%- if page.title -%} + {%- assign seo_title = page.title | append: " " | append: title_separator | append: " " | append: site.title -%} +{%- endif -%} + +{%- if seo_title -%} + {%- assign seo_title = seo_title | markdownify | strip_html | strip_newlines | escape_once -%} +{%- endif -%} + +{% if page.canonical_url %} + {%- assign canonical_url = page.canonical_url %} +{% else %} + {%- assign canonical_url = page.url | replace: "index.html", "" | absolute_url %} +{% endif %} + 
+{%- assign seo_description = page.description | default: page.excerpt | default: site.description -%} +{%- if seo_description -%} + {%- assign seo_description = seo_description | markdownify | strip_html | newline_to_br | strip_newlines | replace: '
', ' ' | escape_once | strip -%} +{%- endif -%} + +{%- assign author = page.author | default: page.authors[0] | default: site.author -%} +{%- assign author = site.data.authors[author] | default: author -%} + +{%- if author.twitter -%} + {%- assign author_twitter = author.twitter | replace: "@", "" -%} +{%- endif -%} + +{%- assign page_large_image = page.header.og_image | default: page.header.overlay_image | default: page.header.image | absolute_url -%} +{%- assign page_large_image = page_large_image | escape -%} + +{%- assign page_teaser_image = page.header.teaser | default: site.og_image | absolute_url -%} +{%- assign page_teaser_image = page_teaser_image | escape -%} + +{%- assign site_og_image = site.og_image | absolute_url -%} +{%- assign site_og_image = site_og_image | escape -%} + +{%- if page.date -%} + {%- assign og_type = "article" -%} +{%- else -%} + {%- assign og_type = "website" -%} +{%- endif -%} + +{{ seo_title | default: site.title }}{% if paginator %}{% unless paginator.page == 1 %} {{ title_separator }} {{ site.data.ui-text[site.locale].page | default: "Page" }} {{ paginator.page }}{% endunless %}{% endif %} + + +{% if author.name %} + + {% if og_type == "article" %} + + {% endif %} +{% endif %} + + + + + + + +{% if seo_description %} + +{% endif %} + +{% if page_large_image %} + +{% elsif page_teaser_image %} + +{% endif %} + +{% if site.twitter.username %} + + + + + + {% if page_large_image %} + + + {% else %} + + {% if page_teaser_image %} + + {% endif %} + {% endif %} + + {% if author_twitter %} + + {% endif %} +{% endif %} + +{% if page.date %} + +{% endif %} + +{% if og_type == "article" and page.last_modified_at %} + +{% endif %} + +{% if site.facebook %} + {% if site.facebook.publisher %} + + {% endif %} + + {% if site.facebook.app_id %} + + {% endif %} +{% endif %} + + + +{% if paginator.previous_page %} + +{% endif %} +{% if paginator.next_page %} + +{% endif %} + + + +{% if site.google_site_verification %} + +{% endif %} +{% if site.bing_site_verification %} + +{% endif %} +{% if site.alexa_site_verification %} + +{% endif %} +{% if site.yandex_site_verification %} + +{% endif %} +{% if site.naver_site_verification %} + +{% endif %} + diff --git a/docs/_includes/sidebar.html b/docs/_includes/sidebar.html new file mode 100644 index 000000000000..a4ca1ca78151 --- /dev/null +++ b/docs/_includes/sidebar.html @@ -0,0 +1,19 @@ +{% if page.author_profile or layout.author_profile or page.sidebar %} + +{% endif %} diff --git a/docs/_includes/skip-links.html b/docs/_includes/skip-links.html new file mode 100644 index 000000000000..2cd9f17d814a --- /dev/null +++ b/docs/_includes/skip-links.html @@ -0,0 +1,8 @@ + diff --git a/docs/_includes/social-share.html b/docs/_includes/social-share.html new file mode 100644 index 000000000000..0b377982b268 --- /dev/null +++ b/docs/_includes/social-share.html @@ -0,0 +1,11 @@ + diff --git a/docs/_includes/tag-list.html b/docs/_includes/tag-list.html new file mode 100644 index 000000000000..e0d02bfa561a --- /dev/null +++ b/docs/_includes/tag-list.html @@ -0,0 +1,26 @@ +{% case site.tag_archive.type %} + {% when "liquid" %} + {% assign path_type = "#" %} + {% when "jekyll-archives" %} + {% assign path_type = nil %} +{% endcase %} + +{% if site.tag_archive.path %} + {% comment %} + + + {% endcomment %} + {% capture page_tags %}{% for tag in page.tags %}{{ tag | downcase }}|{{ tag }}{% unless forloop.last %},{% endunless %}{% endfor %}{% endcapture %} + {% assign tag_hashes = page_tags | split: ',' | sort %} + +

+ {{ site.data.ui-text[site.locale].tags_label | default: "Tags:" }} + + {% for hash in tag_hashes %} + {% assign keyValue = hash | split: '|' %} + {% capture tag_word %}{{ keyValue[1] | strip_newlines }}{% endcapture %} + {% unless forloop.last %}, {% endunless %} + {% endfor %} + +

+{% endif %} \ No newline at end of file diff --git a/docs/_includes/toc b/docs/_includes/toc new file mode 100644 index 000000000000..6423ccdc72e1 --- /dev/null +++ b/docs/_includes/toc @@ -0,0 +1,7 @@ + \ No newline at end of file diff --git a/docs/_includes/toc.html b/docs/_includes/toc.html new file mode 100644 index 000000000000..25b9f6a382b0 --- /dev/null +++ b/docs/_includes/toc.html @@ -0,0 +1,96 @@ +{% capture tocWorkspace %} + {% comment %} + Version 1.0.8 + https://github.com/allejo/jekyll-toc + + "...like all things liquid - where there's a will, and ~36 hours to spare, there's usually a/some way" ~jaybe + + Usage: + {% include toc.html html=content sanitize=true class="inline_toc" id="my_toc" h_min=2 h_max=3 %} + + Parameters: + * html (string) - the HTML of compiled markdown generated by kramdown in Jekyll + + Optional Parameters: + * sanitize (bool) : false - when set to true, the headers will be stripped of any HTML in the TOC + * class (string) : '' - a CSS class assigned to the TOC + * id (string) : '' - an ID to assigned to the TOC + * h_min (int) : 1 - the minimum TOC header level to use; any header lower than this value will be ignored + * h_max (int) : 6 - the maximum TOC header level to use; any header greater than this value will be ignored + * ordered (bool) : false - when set to true, an ordered list will be outputted instead of an unordered list + * item_class (string) : '' - add custom class(es) for each list item; has support for '%level%' placeholder, which is the current heading level + * baseurl (string) : '' - add a base url to the TOC links for when your TOC is on another page than the actual content + * anchor_class (string) : '' - add custom class(es) for each anchor element + + Output: + An ordered or unordered list representing the table of contents of a markdown block. 
This snippet will only + generate the table of contents and will NOT output the markdown given to it + {% endcomment %} + + {% capture my_toc %}{% endcapture %} + {% assign orderedList = include.ordered | default: false %} + {% assign minHeader = include.h_min | default: 1 %} + {% assign maxHeader = include.h_max | default: 6 %} + {% assign nodes = include.html | split: ' maxHeader %} + {% continue %} + {% endif %} + + {% if firstHeader %} + {% assign firstHeader = false %} + {% assign minHeader = headerLevel %} + {% endif %} + + {% assign indentAmount = headerLevel | minus: minHeader %} + {% assign _workspace = node | split: '' | first }}>{% endcapture %} + {% assign header = _workspace[0] | replace: _hAttrToStrip, '' %} + + {% assign space = '' %} + {% for i in (1..indentAmount) %} + {% assign space = space | prepend: ' ' %} + {% endfor %} + + {% unless include.item_class == blank %} + {% capture listItemClass %}{:.{{ include.item_class | replace: '%level%', headerLevel }}}{% endcapture %} + {% endunless %} + + {% capture heading_body %}{% if include.sanitize %}{{ header | strip_html }}{% else %}{{ header }}{% endif %}{% endcapture %} + {% capture my_toc %}{{ my_toc }} +{{ space }}{{ listModifier }} {{ listItemClass }} [{{ heading_body | replace: "|", "\|" }}]({% if include.baseurl %}{{ include.baseurl }}{% endif %}#{{ html_id }}){% if include.anchor_class %}{:.{{ include.anchor_class }}}{% endif %}{% endcapture %} + {% endfor %} + + {% if include.class %} + {% capture my_toc %}{:.{{ include.class }}} +{{ my_toc | lstrip }}{% endcapture %} + {% endif %} + + {% if include.id %} + {% capture my_toc %}{: #{{ include.id }}} +{{ my_toc | lstrip }}{% endcapture %} + {% endif %} +{% endcapture %}{% assign tocWorkspace = '' %}{{ my_toc | markdownify | strip }} diff --git a/docs/_includes/video b/docs/_includes/video new file mode 100644 index 000000000000..d653fd641df6 --- /dev/null +++ b/docs/_includes/video @@ -0,0 +1,24 @@ +{% capture video_id %}{{ include.id }}{% endcapture %} +{% capture video_provider %}{{ include.provider }}{% endcapture %} +{% capture video_danmaku %}{{ include.danmaku | default: 0 }}{% endcapture %} + +{% capture video_src %} + {% case video_provider %} + {% when "vimeo" %} + https://player.vimeo.com/video/{{ video_id }}?dnt=true + {% when "youtube" %} + https://www.youtube-nocookie.com/embed/{{ video_id }} + {% when "google-drive" %} + https://drive.google.com/file/d/{{ video_id }}/preview + {% when "bilibili" %} + https://player.bilibili.com/player.html?bvid={{ video_id }}&page=1&as_wide=1&high_quality=1&danmaku={{ video_danmaku }} + {% endcase %} +{% endcapture %} +{% assign video_src = video_src | strip %} + + +{% unless video_src == "" %} +
+ +
+{% endunless %} diff --git a/docs/_layouts/feed.html b/docs/_layouts/feed.html deleted file mode 100644 index 83b137b6908e..000000000000 --- a/docs/_layouts/feed.html +++ /dev/null @@ -1,22 +0,0 @@ - - - {{ site.title }} - - - {{ site.time | date_to_xmlschema }} - {{ site.url }} - - {{ site.author.name }} - {{ site.author.email }} - - - {% for post in site.posts %} {% if post.tags contains page.tag-name %} - - {{ post.title | xml_escape }} - - {{ post.date | date_to_xmlschema }} - {{ site.url }}{{ post.id }} - {{ post.content | xml_escape }} - - {% endif %} {% endfor %} - diff --git a/docs/_layouts/news-home.html b/docs/_layouts/news-home.html deleted file mode 100644 index 0ebdf0ea609f..000000000000 --- a/docs/_layouts/news-home.html +++ /dev/null @@ -1,67 +0,0 @@ ---- -layout: archive ---- - -{{ content }} - - -{% if paginator %} - {% assign posts = paginator.posts %} -{% else %} - {% assign posts = site.posts %} -{% endif %} - - - -
- {% for post in site.posts %} -
- - - -
- {% endfor %} -
- - - - - - - - - - diff --git a/docs/_layouts/single-full.html b/docs/_layouts/single-full.html new file mode 100644 index 000000000000..8dce93ad491b --- /dev/null +++ b/docs/_layouts/single-full.html @@ -0,0 +1,82 @@ +--- +layout: default +--- + +{% if page.header.overlay_color or page.header.overlay_image or page.header.image %} + {% include page__hero.html %} +{% elsif page.header.video.id and page.header.video.provider %} + {% include page__hero_video.html %} +{% endif %} + +
+ +
+ {% if page.title %}{% endif %} + {% if page.excerpt %}{% endif %} + {% if page.date %}{% endif %} + {% if page.last_modified_at %}{% endif %} + +
+ {% unless page.header.overlay_color or page.header.overlay_image %} +
+ {% if page.title %}

{{ page.title | markdownify | remove: "

" | remove: "

" }}

{% endif %} + {% include page__meta.html %} +
+ {% endunless %} + +
+ {% if page.toc %} + + {% endif %} + {{ content }} + {% if page.link %}{% endif %} +
+ +
+ {% if site.data.ui-text[site.locale].meta_label %} +

{{ site.data.ui-text[site.locale].meta_label }}

+ {% endif %} + {% include page__taxonomy.html %} + {% include page__date.html %} +
+ + {% if page.share %}{% include social-share.html %}{% endif %} + + {% include post_pagination.html %} +
+ + {% if jekyll.environment == 'production' and site.comments.provider and page.comments %} + {% include comments.html %} + {% endif %} +
+ + {% comment %}{% endcomment %} + {% if page.id and page.related and site.related_posts.size > 0 %} + + {% comment %}{% endcomment %} + {% elsif page.id and page.related %} + + {% endif %} +
diff --git a/docs/_layouts/tags.html b/docs/_layouts/tags.html deleted file mode 100644 index 43f34f6771f4..000000000000 --- a/docs/_layouts/tags.html +++ /dev/null @@ -1,16 +0,0 @@ ---- -layout: default ---- - -
-

Articles tagged with ""

-
    - - {% for post in site.posts %} - {% if post.tags contains page.tag-name %} -
  • {{ post.title }}, published {{ post.date | date: "%Y-%m-%d" }}
  • - {% endif %} - {% endfor %} - -
-
diff --git a/docs/_posts/2020-02-13-release.md b/docs/_posts/2020-02-13-release.md index d8482de7288b..50581ca0c102 100644 --- a/docs/_posts/2020-02-13-release.md +++ b/docs/_posts/2020-02-13-release.md @@ -1,8 +1,7 @@ --- -layout: single title: "ZeRO & DeepSpeed: New system optimizations enable training models with over 100 billion parameters" date: 2020-02-13 link: https://www.microsoft.com/en-us/research/blog/zero-deepspeed-new-system-optimizations-enable-training-models-with-over-100-billion-parameters/ excerpt: "Developed by Microsoft AI & Research." -categories: training zero +tags: training zero --- diff --git a/docs/_posts/2020-02-13-turing-nlg.md b/docs/_posts/2020-02-13-turing-nlg.md index cb9ee59e314f..0da59aa8fee3 100644 --- a/docs/_posts/2020-02-13-turing-nlg.md +++ b/docs/_posts/2020-02-13-turing-nlg.md @@ -1,8 +1,7 @@ --- -layout: single title: "Turing-NLG: A 17-billion-parameter language model by Microsoft" date: 2020-02-13 link: https://www.microsoft.com/en-us/research/blog/turing-nlg-a-17-billion-parameter-language-model-by-microsoft/ excerpt: "DeepSpeed was used to train the world's largest language model." -categories: training +tags: training --- diff --git a/docs/_posts/2020-05-19-bert-record.md b/docs/_posts/2020-05-19-bert-record.md index ce2f58b231f1..47599a5a8aed 100644 --- a/docs/_posts/2020-05-19-bert-record.md +++ b/docs/_posts/2020-05-19-bert-record.md @@ -1,9 +1,7 @@ --- -layout: single title: "The Fastest and Most Efficient BERT Training through Optimized Transformer Kernels" excerpt: "" -categories: training -new_post: true +tags: training date: 2020-05-19 00:00:00 --- diff --git a/docs/_posts/2020-05-19-press-release.md b/docs/_posts/2020-05-19-press-release.md index b8e2dd09b02f..a4da131f06a1 100644 --- a/docs/_posts/2020-05-19-press-release.md +++ b/docs/_posts/2020-05-19-press-release.md @@ -1,9 +1,7 @@ --- -layout: single title: "ZeRO-2 & DeepSpeed: Shattering Barriers of Deep Learning Speed & Scale" excerpt: "" link: https://www.microsoft.com/en-us/research/blog/zero-2-deepspeed-shattering-barriers-of-deep-learning-speed-scale/ -categories: training zero -new_post: false +tags: training zero date: 2020-05-19 02:00:00 --- diff --git a/docs/_posts/2020-05-19-zero-stage2.md b/docs/_posts/2020-05-19-zero-stage2.md index 39504032d2ae..7c5a1e912a17 100644 --- a/docs/_posts/2020-05-19-zero-stage2.md +++ b/docs/_posts/2020-05-19-zero-stage2.md @@ -1,9 +1,7 @@ --- -layout: single title: "An Order-of-Magnitude Larger and Faster Training with ZeRO-2" excerpt: "" -categories: training zero -new_post: false +tags: training zero date: 2020-05-19 01:00:00 --- diff --git a/docs/_posts/2020-05-28-fastest-bert-training.md b/docs/_posts/2020-05-28-fastest-bert-training.md index 1eaf6afc4f1b..99d132c1e53d 100644 --- a/docs/_posts/2020-05-28-fastest-bert-training.md +++ b/docs/_posts/2020-05-28-fastest-bert-training.md @@ -1,9 +1,7 @@ --- -layout: single title: "Microsoft DeepSpeed achieves the fastest BERT training time" excerpt: "" -categories: training -new_post: false +tags: training date: 2020-05-28 00:00:00 --- diff --git a/docs/_posts/2020-07-24-deepspeed-webinar.md b/docs/_posts/2020-07-24-deepspeed-webinar.md index 58f3674845e3..be4ee777ed61 100644 --- a/docs/_posts/2020-07-24-deepspeed-webinar.md +++ b/docs/_posts/2020-07-24-deepspeed-webinar.md @@ -1,10 +1,8 @@ --- -layout: single title: "DeepSpeed Microsoft Research Webinar on August 6th, 2020" excerpt: "" -categories: presentations +tags: presentations link: 
https://note.microsoft.com/MSR-Webinar-DeepSpeed-Registration-On-Demand.html image: /assets/images/webinar-aug2020.png -new_post: true date: 2020-07-24 00:00:00 --- diff --git a/docs/_posts/2020-08-07-webinar-on-demand.md b/docs/_posts/2020-08-07-webinar-on-demand.md index 3173df1f7881..983e17eca36b 100644 --- a/docs/_posts/2020-08-07-webinar-on-demand.md +++ b/docs/_posts/2020-08-07-webinar-on-demand.md @@ -1,9 +1,7 @@ --- -layout: single title: "DeepSpeed Microsoft Research Webinar is now on-demand" excerpt: "" -categories: presentations +tags: presentations link: https://note.microsoft.com/MSR-Webinar-DeepSpeed-Registration-On-Demand.html -new_post: true date: 2020-08-07 00:00:00 --- diff --git a/docs/_posts/2020-09-08-sparse-attention-news.md b/docs/_posts/2020-09-08-sparse-attention-news.md index 3d5c4cdcb5f9..2ae615c45c82 100644 --- a/docs/_posts/2020-09-08-sparse-attention-news.md +++ b/docs/_posts/2020-09-08-sparse-attention-news.md @@ -1,9 +1,7 @@ --- -layout: single title: "Powering 10x longer sequences and 6x faster execution through DeepSpeed Sparse Attention" excerpt: "" -categories: training -new_post: true +tags: training date: 2020-09-09 00:00:00 --- diff --git a/docs/_posts/2020-09-09-ZeRO-Offload.md b/docs/_posts/2020-09-09-ZeRO-Offload.md index 749683b25ec9..353b8b50f701 100755 --- a/docs/_posts/2020-09-09-ZeRO-Offload.md +++ b/docs/_posts/2020-09-09-ZeRO-Offload.md @@ -1,10 +1,8 @@ --- -layout: single title: "10x bigger model training on a single GPU with ZeRO-Offload" excerpt: "" -new_post: true date: 2020-09-09 00:00:00 -categories: training zero +tags: training zero --- We introduce a new technology called ZeRO-Offload to enable **10X bigger model training on a single GPU**. ZeRO-Offload extends ZeRO-2 to leverage both CPU and GPU memory for training large models. Using a machine with **a single GPU**, our users now can run **models of up to 13 billion parameters** without running out of memory, 10x bigger than the existing approaches, while obtaining competitive throughput. This feature democratizes multi-billion-parameter model training and opens the window for many deep learning practitioners to explore bigger and better models. diff --git a/docs/_posts/2020-09-09-onebit-adam-blog-post.md b/docs/_posts/2020-09-09-onebit-adam-blog-post.md index ffe0f69f317f..ee25a73efa1c 100644 --- a/docs/_posts/2020-09-09-onebit-adam-blog-post.md +++ b/docs/_posts/2020-09-09-onebit-adam-blog-post.md @@ -1,10 +1,8 @@ --- -layout: single title: "DeepSpeed with 1-bit Adam: 5x less communication and 3.4x faster training" excerpt: "" -new_post: false date: 2020-09-09 00:00:00 -categories: training communication +tags: training communication --- ## 1. 
Introduction

diff --git a/docs/_posts/2020-09-09-onebit-adam-news.md b/docs/_posts/2020-09-09-onebit-adam-news.md
index 109631251962..19253ac76b00 100644
--- a/docs/_posts/2020-09-09-onebit-adam-news.md
+++ b/docs/_posts/2020-09-09-onebit-adam-news.md
@@ -1,10 +1,8 @@
 ---
-layout: single
 title: "Up to 5x less communication and 3.4x faster training through 1-bit Adam"
 excerpt: ""
-new_post: true
 date: 2020-09-09 00:00:00
-categories: training communication
+tags: training communication
 ---
diff --git a/docs/_posts/2020-09-09-pipeline-parallelism.md b/docs/_posts/2020-09-09-pipeline-parallelism.md
index af537ffcd62c..4f2e53ed80ee 100644
--- a/docs/_posts/2020-09-09-pipeline-parallelism.md
+++ b/docs/_posts/2020-09-09-pipeline-parallelism.md
@@ -1,10 +1,8 @@
 ---
-layout: single
 title: "Training a Trillion Parameters with Pipeline Parallelism"
 excerpt: ""
-new_post: true
 date: 2020-09-09 00:00:00
-categories: training
+tags: training
 ---

 DeepSpeed includes new support for pipeline parallelism! DeepSpeed's training
diff --git a/docs/_posts/2020-09-09-sparse-attention.md b/docs/_posts/2020-09-09-sparse-attention.md
index 40fdfb449ef1..aa0fa0bb60d4 100644
--- a/docs/_posts/2020-09-09-sparse-attention.md
+++ b/docs/_posts/2020-09-09-sparse-attention.md
@@ -1,10 +1,8 @@
 ---
-layout: single
 title: "DeepSpeed Sparse Attention"
 excerpt: ""
-new_post: true
 date: 2020-09-09 01:00:00
-categories: training inference
+tags: training inference
 ---

 Attention-based deep learning models such as transformers are highly effective in capturing relationships between tokens in an input sequence, even across long distances. As a result, they are used with text, image, and sound-based inputs, where the sequence length can be in thousands of tokens. However, despite the effectiveness of attention modules in capturing long-term dependencies, in practice their application to long-sequence inputs is limited by the compute and memory requirements of the attention computation, which grow quadratically, `O(n^2)`, with the sequence length `n`.
diff --git a/docs/_posts/2020-10-28-progressive-layer-dropping-news.md b/docs/_posts/2020-10-28-progressive-layer-dropping-news.md
index 53a995da93b6..b55d1cb7d8cf 100755
--- a/docs/_posts/2020-10-28-progressive-layer-dropping-news.md
+++ b/docs/_posts/2020-10-28-progressive-layer-dropping-news.md
@@ -1,10 +1,8 @@
 ---
-layout: single
 title: "Progressive Layer Dropping"
 excerpt: ""
-new_post: true
 date: 2020-10-29 00:00:00
-categories: training
+tags: training
 ---

 We introduce a new technology called progressive layer dropping (PLD) to speed up the pre-training of Transformer-based networks through efficient and robust compressed training. The pre-training step of Transformer networks often suffers from unbearable overall computational expense. We analyze the training dynamics and stability of Transformer networks and propose PLD to sparsely update Transformer blocks following a progressive dropping schedule, which smoothly increases the layer dropping rate for each mini-batch as training evolves along both the temporal and the model-depth dimensions. PLD allows pre-training to reach similar accuracy on downstream tasks **2.5X faster**, and training on the same number of samples to be **24% faster**, without the cost of excessive hardware resources.
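As a rough sketch of what such a progressive schedule can look like (the function name, decay form, and constants below are illustrative assumptions, not DeepSpeed's actual implementation):

```python
import math

def keep_probability(step, gamma=0.001, theta_bar=0.5):
    """Illustrative progressive schedule: the probability of keeping a
    layer starts at 1.0 and decays smoothly toward the floor theta_bar
    as training advances, so later mini-batches drop more layers."""
    return (1.0 - theta_bar) * math.exp(-gamma * step) + theta_bar

print(keep_probability(0))               # 1.0 -> every block is updated
print(round(keep_probability(5000), 3))  # ~0.503 -> roughly half are dropped
```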
diff --git a/docs/_posts/2021-03-08-zero3-offload.md b/docs/_posts/2021-03-08-zero3-offload.md index ea394e46fc37..2ce5ef919a0d 100644 --- a/docs/_posts/2021-03-08-zero3-offload.md +++ b/docs/_posts/2021-03-08-zero3-offload.md @@ -1,10 +1,8 @@ --- -layout: single title: "DeepSpeed ZeRO-3 Offload" excerpt: "" -new_post: true date: 2021-03-08 00:00:00 -categories: training zero +tags: training zero --- Today we are announcing the release of ZeRO-3 Offload, a highly efficient and easy to use implementation of ZeRO Stage 3 and ZeRO Offload combined, geared towards our continued goal of democratizing AI by making efficient large-scale DL training available to everyone. The key benefits of ZeRO-3 Offload are: diff --git a/docs/_posts/2021-05-05-MoQ.md b/docs/_posts/2021-05-05-MoQ.md index 8e2255293dbe..e6f7872a4007 100644 --- a/docs/_posts/2021-05-05-MoQ.md +++ b/docs/_posts/2021-05-05-MoQ.md @@ -1,10 +1,8 @@ --- -layout: single title: "Mixture-of-Quantization: A novel quantization approach for reducing model size with minimal accuracy impact" excerpt: "" -new_post: false date: 2021-05-05 00:00:00 -categories: inference +tags: inference --- ## A unified suite for quantization-aware training and inference diff --git a/docs/_posts/2021-05-05-inference-kernel-optimization.md b/docs/_posts/2021-05-05-inference-kernel-optimization.md index 933e00fa7449..63e3ac669e22 100644 --- a/docs/_posts/2021-05-05-inference-kernel-optimization.md +++ b/docs/_posts/2021-05-05-inference-kernel-optimization.md @@ -1,10 +1,8 @@ --- -layout: single title: "DeepSpeed Inference: Multi-GPU inference with customized inference kernels and quantization support" excerpt: "" -new_post: false date: 2021-03-16 00:00:00 -categories: inference +tags: inference --- While DeepSpeed supports training advanced large-scale models, using these trained models in the desired application scenarios is still challenging due to three major limitations in existing inference solutions: 1) lack of support for multi-GPU inference to fit large models and meet latency requirements, 2) limited GPU kernel performance when running inference with small batch sizes, and 3) difficulties in exploiting quantization, which includes both quantizing the model to reduce the model size and latency as well as supporting high-performance inference of quantized models without specialized hardware. diff --git a/docs/_posts/2021-05-14-inference-release.md b/docs/_posts/2021-05-14-inference-release.md index 2f6755d3679d..94e69503c40c 100644 --- a/docs/_posts/2021-05-14-inference-release.md +++ b/docs/_posts/2021-05-14-inference-release.md @@ -1,8 +1,7 @@ --- -layout: single title: "DeepSpeed: Accelerating large-scale model inference and training via system optimizations and compression" date: 2021-05-14 link: https://www.microsoft.com/en-us/research/blog/deepspeed-accelerating-large-scale-model-inference-and-training-via-system-optimizations-and-compression/ excerpt: "Developed by Microsoft AI & Research." 
-categories: inference
+tags: inference
 ---
diff --git a/docs/_posts/2021-08-18-deepspeed-moe.md b/docs/_posts/2021-08-18-deepspeed-moe.md
index 86e27ff2edb7..5bd9667f2a7f 100644
--- a/docs/_posts/2021-08-18-deepspeed-moe.md
+++ b/docs/_posts/2021-08-18-deepspeed-moe.md
@@ -1,9 +1,7 @@
 ---
-layout: single
 title: "DeepSpeed powers 8x larger MoE model training with high performance"
 excerpt: ""
 link: https://www.microsoft.com/en-us/research/blog/deepspeed-powers-8x-larger-moe-model-training-with-high-performance/
-new_post: true
 date: 2021-08-18 00:00:00
-categories: training
+tags: training
 ---
diff --git a/docs/_posts/2021-11-15-autotuning.md b/docs/_posts/2021-11-15-autotuning.md
index 509f691e57f1..650f099ecb29 100644
--- a/docs/_posts/2021-11-15-autotuning.md
+++ b/docs/_posts/2021-11-15-autotuning.md
@@ -1,10 +1,8 @@
 ---
-layout: single
 title: "Autotuning: Automatically discover the optimal DeepSpeed configuration that delivers good training speed"
 excerpt: ""
-new_post: true
-date: 2021-11-16 00:00:00
-categories: training
+date: 2021-11-16 10:00:00
+tags: training
 ---

 We introduce a new feature called Autotuning to automatically discover the optimal DeepSpeed configuration that delivers good training speed. One pain point in model training is figuring out good performance-relevant configurations, such as micro-batch size, to fully utilize the hardware and achieve a high throughput number. This configuration exploration process is commonly done manually, but it is important since model training is repeated many times and benefits from using a good configuration. Not only is the hand-tuning process time-consuming, but the outcome is hardware-dependent. This means that a good configuration on one hardware setup might not be the best on different hardware, and the user thus has to hand-tune the configuration again. With DeepSpeed, there are more configuration parameters that could potentially affect the training speed, making it even more tedious to tune the configuration manually.
diff --git a/docs/_posts/2021-12-09-deepspeed-moe-nlg.md b/docs/_posts/2021-12-09-deepspeed-moe-nlg.md
index 2e2b19c9cc2e..99bc86cbd5d2 100644
--- a/docs/_posts/2021-12-09-deepspeed-moe-nlg.md
+++ b/docs/_posts/2021-12-09-deepspeed-moe-nlg.md
@@ -1,14 +1,10 @@
 ---
-layout: single
 title: "DeepSpeed-MoE for NLG: Reducing the training cost of language models by 5 times"
 excerpt: ""
-new_post: false
 date: 2021-12-09 22:00:00
-categories: training
+tags: training
 ---

-Published on December 9, 2021
-
 [By DeepSpeed Team](https://www.microsoft.com/en-us/research/project/deepspeed/people/)

 Autoregressive transformer-based natural language generation (referred to as
diff --git a/docs/_posts/2022-01-19-moe-inference.md b/docs/_posts/2022-01-19-moe-inference.md
index 3cfab04b96cc..f2ac1c6de2e1 100644
--- a/docs/_posts/2022-01-19-moe-inference.md
+++ b/docs/_posts/2022-01-19-moe-inference.md
@@ -1,9 +1,7 @@
 ---
-layout: single
 title: "DeepSpeed: Advancing MoE inference and training to power next-generation AI scale"
 excerpt: ""
 link: https://www.microsoft.com/en-us/research/blog/deepspeed-advancing-moe-inference-and-training-to-power-next-generation-ai-scale/
-new_post: true
 date: 2022-01-19 00:00:00
-categories: inference
+tags: inference
 ---
diff --git a/docs/_sass/minimal-mistakes.scss b/docs/_sass/minimal-mistakes.scss
new file mode 100644
index 000000000000..7f25575784dd
--- /dev/null
+++ b/docs/_sass/minimal-mistakes.scss
@@ -0,0 +1,65 @@
+/*!
+ * Minimal Mistakes Jekyll Theme 4.20.2 by Michael Rose + * Copyright 2013-2020 Michael Rose - mademistakes.com | @mmistakes + * Licensed under MIT (https://github.com/mmistakes/minimal-mistakes/blob/master/LICENSE) +*/ + +/* Variables */ +@import "minimal-mistakes/variables"; + +/* Mixins and functions */ +@import "minimal-mistakes/vendor/breakpoint/breakpoint"; +@include breakpoint-set("to ems", true); +@import "minimal-mistakes/vendor/magnific-popup/magnific-popup"; // Magnific Popup +@import "minimal-mistakes/vendor/susy/susy"; +@import "minimal-mistakes/mixins"; + +/* Core CSS */ +@import "minimal-mistakes/reset"; +@import "minimal-mistakes/base"; +@import "minimal-mistakes/forms"; +@import "minimal-mistakes/tables"; +@import "minimal-mistakes/animations"; + +/* Components */ +@import "minimal-mistakes/buttons"; +@import "minimal-mistakes/notices"; +@import "minimal-mistakes/masthead"; +@import "minimal-mistakes/navigation"; +@import "minimal-mistakes/footer"; +@import "minimal-mistakes/search"; +@import "minimal-mistakes/syntax"; + +/* Utility classes */ +@import "minimal-mistakes/utilities"; + +/* Layout specific */ +@import "minimal-mistakes/page"; +@import "minimal-mistakes/archive"; +@import "minimal-mistakes/sidebar"; +@import "minimal-mistakes/print"; + + +.wide2 { + .page { + float: left; + width: 115%; + @include breakpoint($large) { + padding-left: 15%; + } + + @include breakpoint($x-large) { + padding-left: 15%; + } + } + + .page__related { + @include breakpoint($large) { + padding-left: 15%; + } + + @include breakpoint($x-large) { + padding-left: 15%; + } + } + } diff --git a/docs/assets/css/main.scss b/docs/assets/css/main.scss index 26a771784d01..4f31bd44dd40 100644 --- a/docs/assets/css/main.scss +++ b/docs/assets/css/main.scss @@ -45,3 +45,67 @@ @include yiq-contrasted($active-color); } } + +/* CSS */ +.button-15 { + background-image: linear-gradient(#42A1EC, #0070C9); + border: 1px solid #0077CC; + border-radius: 4px; + box-sizing: border-box; + color: #FFFFFF; + cursor: pointer; + direction: ltr; + display: block; + font-family: "SF Pro Text","SF Pro Icons","AOS Icons","Helvetica Neue",Helvetica,Arial,sans-serif; + font-size: 17px; + font-weight: 400; + letter-spacing: -.022em; + line-height: 1.47059; + min-width: 30px; + overflow: visible; + padding: 4px 15px; + text-align: center; + vertical-align: baseline; + user-select: none; + -webkit-user-select: none; + touch-action: manipulation; + white-space: nowrap; +} + +.button-15:disabled { + cursor: default; + opacity: .3; +} + +.button-15:hover { + background-image: linear-gradient(#51A9EE, #147BCD); + border-color: #1482D0; + text-decoration: none; +} + +.button-15:active { + background-image: linear-gradient(#3D94D9, #0067B9); + border-color: #006DBC; + outline: none; +} + +.button-15:focus { + box-shadow: rgba(131, 192, 253, 0.5) 0 0 0 3px; + outline: none; +} + +ul.tag-box li { + display: inline-block; + list-style: none; + list-style-image: none; + margin-bottom: 7px; +} +ul.tag-box li a { + background: #e6e6e6; + padding: 4px 8px; + border-radius: 3px; + color: #f76b48; +} +ul.tag-box li span.size { + font-weight: 300; +} \ No newline at end of file diff --git a/docs/news/index.html b/docs/news/index.html deleted file mode 100644 index 6cfe0b7a14c1..000000000000 --- a/docs/news/index.html +++ /dev/null @@ -1,3 +0,0 @@ ---- -layout: news ---- diff --git a/docs/_layouts/news.html b/docs/tags.md similarity index 63% rename from docs/_layouts/news.html rename to docs/tags.md index d0d5f82787ac..54c3f9c3cf69 100644 
--- a/docs/_layouts/news.html +++ b/docs/tags.md @@ -1,7 +1,6 @@ --- layout: archive -post-content: -backsite: javascript:history.back() +permalink: /posts/ --- {% if paginator %} @@ -13,8 +12,8 @@ + -
- +
+ {% assign tags = site.tags | sort %} {% for category in tags %} {% assign cat = category | first %} - + {% endfor %}
diff --git a/docs/tags_list.md b/docs/tags_list.md index c56491ae1550..a9ec54c8fe86 100644 --- a/docs/tags_list.md +++ b/docs/tags_list.md @@ -16,7 +16,9 @@ permalink: /tags/ {% assign t = tag | first %} {% assign posts = tag | last %} +

{{ t }}

+
    {% for post in posts %} {% if post.tags contains t %} From da303ff2a3150e5d0bab06a5602880449d61001c Mon Sep 17 00:00:00 2001 From: Cheng Li Date: Mon, 28 Feb 2022 23:57:30 +0500 Subject: [PATCH 06/20] add tagging list view --- docs/tags.md | 13 ++++++------- docs/tags_list.md | 12 +++++++++--- 2 files changed, 15 insertions(+), 10 deletions(-) diff --git a/docs/tags.md b/docs/tags.md index ec983b5115b8..5600b08d00ce 100644 --- a/docs/tags.md +++ b/docs/tags.md @@ -39,13 +39,12 @@ permalink: /posts/ {% assign id = id | plus:1 %}

    - {{ post.articletitle }} - {%- unless post.hidden -%} - {% include archive-single.html %} - {% if post.image %} - - {% endif %} - {%- endunless -%} + {%- unless post.hidden -%} + {% include archive-single.html %} + {% if post.image %} + + {% endif %} + {%- endunless -%}

    {% endfor %} diff --git a/docs/tags_list.md b/docs/tags_list.md index a9ec54c8fe86..2309f3981392 100644 --- a/docs/tags_list.md +++ b/docs/tags_list.md @@ -22,9 +22,15 @@ permalink: /tags/
      {% for post in posts %} {% if post.tags contains t %} -
    • - {{ post.date | date: '%d %b %y' }}: {{ post.title }} -
    • + {% if post.link %} +
    • + {{ post.date | date: '%d %b %y' }}: {{ post.title }} +
    • + {% else %} +
    • + {{ post.date | date: '%d %b %y' }}: {{ post.title }} +
    • + {% endif %} {% endif %} {% endfor %}
    From 718362a6082a7f3f5d75af276bb2dc04d2535982 Mon Sep 17 00:00:00 2001 From: Cheng Li Date: Tue, 1 Mar 2022 00:52:52 +0500 Subject: [PATCH 07/20] add count to tags --- docs/tags.md | 4 ++-- docs/tags_list.md | 39 +++++++++++++++++++-------------------- 2 files changed, 21 insertions(+), 22 deletions(-) diff --git a/docs/tags.md b/docs/tags.md index 5600b08d00ce..015f1a4bcb44 100644 --- a/docs/tags.md +++ b/docs/tags.md @@ -24,11 +24,11 @@ permalink: /posts/
    - + {% assign tags = site.tags | sort %} {% for category in tags %} {% assign cat = category | first %} - + {% endfor %}
    diff --git a/docs/tags_list.md b/docs/tags_list.md index 2309f3981392..532cd0c62ea6 100644 --- a/docs/tags_list.md +++ b/docs/tags_list.md @@ -7,31 +7,30 @@ permalink: /tags/ {% for tag in sorted_tags %} {% assign t = tag | first %} {% assign posts = tag | last %} - -
    -

    {{ t }}

    -
    -
      -{% for post in posts %} - {% if post.tags contains t %} - {% if post.link %} -
    • - {{ post.date | date: '%d %b %y' }}: {{ post.title }} -
    • - {% else %} -
    • - {{ post.date | date: '%d %b %y' }}: {{ post.title }} -
    • +
      +

      {{ t }}

      +
      +
        + {% for post in posts %} + {% if post.tags contains t %} + {% if post.link %} +
      • + {{ post.date | date: '%d %b %y' }}: {{ post.title }} +
      • + {% else %} +
      • + {{ post.date | date: '%d %b %y' }}: {{ post.title }} +
      • + {% endif %} {% endif %} - {% endif %} -{% endfor %} -
      + {% endfor %} +
    {% endfor %} From 7d3c3fe149f8e0d436a6f922918e96ee7b4a7793 Mon Sep 17 00:00:00 2001 From: Cheng Li Date: Tue, 1 Mar 2022 00:59:25 +0500 Subject: [PATCH 08/20] add moe inference tutorial --- ...{moe-inference-tutorial.md => mixture-of-experts-inference.md} | 0 1 file changed, 0 insertions(+), 0 deletions(-) rename docs/_tutorials/{moe-inference-tutorial.md => mixture-of-experts-inference.md} (100%) diff --git a/docs/_tutorials/moe-inference-tutorial.md b/docs/_tutorials/mixture-of-experts-inference.md similarity index 100% rename from docs/_tutorials/moe-inference-tutorial.md rename to docs/_tutorials/mixture-of-experts-inference.md From 4d14f0c1862d2511d21e332e62a2279fe591bd61 Mon Sep 17 00:00:00 2001 From: Cheng Li Date: Tue, 1 Mar 2022 01:01:52 +0500 Subject: [PATCH 09/20] fix typo --- docs/_config.yml | 1 + docs/_data/navigation.yml | 2 ++ 2 files changed, 3 insertions(+) diff --git a/docs/_config.yml b/docs/_config.yml index e5642cbfcded..bb545716cec6 100644 --- a/docs/_config.yml +++ b/docs/_config.yml @@ -45,6 +45,7 @@ collections: - megatron.md - mixture-of-experts.md - mixture-of-experts-nlg.md + - moe-inference.md - one-cycle.md - onebit-adam.md - onebit-lamb.md diff --git a/docs/_data/navigation.yml b/docs/_data/navigation.yml index 6f117f710aca..21bf5fc14a20 100755 --- a/docs/_data/navigation.yml +++ b/docs/_data/navigation.yml @@ -96,6 +96,8 @@ lnav: url: /tutorials/mixture-of-experts/ - title: 'Mixture-of-Experts for NLG' url: /tutorials/mixture-of-experts-nlg/ + - title: 'Mixture-of-Experts Inference' + url: /tutorials/mixture-of-experts-inference/ - title: 'Mixture-of-Quantization' url: /tutorials/MoQ-tutorial/ - title: 'One-Cycle Schedule' From 632453c852df44a04d461becdd88ce84e5ac090a Mon Sep 17 00:00:00 2001 From: Cheng Li Date: Tue, 1 Mar 2022 03:28:20 +0500 Subject: [PATCH 10/20] fix format --- docs/_includes/analytics.html | 2 +- docs/_includes/author-profile-custom-links.html | 2 +- docs/_includes/category-list.html | 2 +- docs/_includes/group-by-array | 2 +- docs/_includes/page__taxonomy.html | 2 +- docs/_includes/post_pagination.html | 2 +- docs/_includes/tag-list.html | 2 +- docs/_includes/toc | 2 +- docs/tags.md | 2 -- 9 files changed, 8 insertions(+), 10 deletions(-) diff --git a/docs/_includes/analytics.html b/docs/_includes/analytics.html index 371469f0af9b..5c85236124c2 100644 --- a/docs/_includes/analytics.html +++ b/docs/_includes/analytics.html @@ -11,4 +11,4 @@ {% include /analytics-providers/custom.html %} {% endcase %} -{% endif %} \ No newline at end of file +{% endif %} diff --git a/docs/_includes/author-profile-custom-links.html b/docs/_includes/author-profile-custom-links.html index b89ffcb7df6c..06e0b630f688 100644 --- a/docs/_includes/author-profile-custom-links.html +++ b/docs/_includes/author-profile-custom-links.html @@ -4,4 +4,4 @@ Custom Social Profile Link ---> \ No newline at end of file +--> diff --git a/docs/_includes/category-list.html b/docs/_includes/category-list.html index d684a2829f3b..4f38f11b51e8 100644 --- a/docs/_includes/category-list.html +++ b/docs/_includes/category-list.html @@ -23,4 +23,4 @@ {% endfor %}

    -{% endif %} \ No newline at end of file +{% endif %} diff --git a/docs/_includes/group-by-array b/docs/_includes/group-by-array index 708de41ae3f8..528e40b106c6 100644 --- a/docs/_includes/group-by-array +++ b/docs/_includes/group-by-array @@ -44,4 +44,4 @@ {% assign group_items = group_items | push: __item %} -{% endfor %} \ No newline at end of file +{% endfor %} diff --git a/docs/_includes/page__taxonomy.html b/docs/_includes/page__taxonomy.html index 75c76c81ddf2..f10b2026a22b 100644 --- a/docs/_includes/page__taxonomy.html +++ b/docs/_includes/page__taxonomy.html @@ -4,4 +4,4 @@ {% if site.category_archive.type and page.categories[0] %} {% include category-list.html %} -{% endif %} \ No newline at end of file +{% endif %} diff --git a/docs/_includes/post_pagination.html b/docs/_includes/post_pagination.html index a93c6279763b..c09dd29f0345 100644 --- a/docs/_includes/post_pagination.html +++ b/docs/_includes/post_pagination.html @@ -11,4 +11,4 @@ {{ site.data.ui-text[site.locale].pagination_next | default: "Next" }} {% endif %} -{% endif %} \ No newline at end of file +{% endif %} diff --git a/docs/_includes/tag-list.html b/docs/_includes/tag-list.html index e0d02bfa561a..18ee8bdf1d00 100644 --- a/docs/_includes/tag-list.html +++ b/docs/_includes/tag-list.html @@ -23,4 +23,4 @@ {% endfor %}

    -{% endif %} \ No newline at end of file +{% endif %} diff --git a/docs/_includes/toc b/docs/_includes/toc index 6423ccdc72e1..a234afafad40 100644 --- a/docs/_includes/toc +++ b/docs/_includes/toc @@ -4,4 +4,4 @@ * Auto generated table of contents {:toc .toc__menu} - \ No newline at end of file + diff --git a/docs/tags.md b/docs/tags.md index 015f1a4bcb44..035f6cfe153d 100644 --- a/docs/tags.md +++ b/docs/tags.md @@ -49,5 +49,3 @@ permalink: /posts/
{% endfor %} - - From 921ed10fed884b592a4d9a0ea79692d49afbf30a Mon Sep 17 00:00:00 2001 From: Cheng Li Date: Tue, 1 Mar 2022 07:25:25 +0500 Subject: [PATCH 11/20] tagging tutorials --- docs/_pages/tutorials-landing.md | 45 ++++++++++++++++++- docs/_sass/button-group.scss | 4 +- docs/_tutorials/MoQ-tutorial.md | 1 + docs/_tutorials/advanced-install.md | 1 + docs/_tutorials/autotuning.md | 1 + docs/_tutorials/azure.md | 1 + docs/_tutorials/bert-finetuning.md | 1 + docs/_tutorials/bert-pretraining.md | 1 + docs/_tutorials/cifar-10.md | 1 + docs/_tutorials/curriculum-learning.md | 1 + docs/_tutorials/flops-profiler.md | 1 + docs/_tutorials/gan.md | 1 + docs/_tutorials/getting-started.md | 2 +- docs/_tutorials/inference-tutorial.md | 1 + docs/_tutorials/large-models-w-deepspeed.md | 1 + docs/_tutorials/lrrt.md | 1 + docs/_tutorials/megatron.md | 1 + .../mixture-of-experts-inference.md | 1 + docs/_tutorials/mixture-of-experts-nlg.md | 1 + docs/_tutorials/mixture-of-experts.md | 1 + docs/_tutorials/one-cycle.md | 1 + docs/_tutorials/onebit-adam.md | 1 + docs/_tutorials/onebit-lamb.md | 1 + docs/_tutorials/pipeline.md | 1 + docs/_tutorials/progressive_layer_dropping.md | 2 +- docs/_tutorials/pytorch-profiler.md | 1 + docs/_tutorials/sparse-attention.md | 1 + docs/_tutorials/transformer_kernel.md | 3 +- docs/_tutorials/zero-offload.md | 1 + docs/_tutorials/zero.md | 1 + docs/tags.md | 7 +-- 31 files changed, 77 insertions(+), 11 deletions(-) diff --git a/docs/_pages/tutorials-landing.md b/docs/_pages/tutorials-landing.md index 5447e137c9fd..c7d6af66f411 100644 --- a/docs/_pages/tutorials-landing.md +++ b/docs/_pages/tutorials-landing.md @@ -1,6 +1,49 @@ --- title: "Tutorials" -layout: collection +layout: archive collection: tutorials permalink: /tutorials/ --- + + +{% if paginator %} + {% assign tutorials = paginator.tutorials %} +{% else %} + {% assign tutorials = site.tutorials %} +{% endif %} + + + +
+ + {% assign tags = site.tutorials | map: 'tags' | join: ',' | split: ',' | group_by: tag %} + {% for cat in tags %} + + {% endfor %} +
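+  {% comment %}
+    The filter chain above flattens every tutorial's tag list into one array
+    of tag strings before grouping, so each `cat` corresponds to one distinct
+    tag (the behavior of `group_by` over plain strings is assumed here).
+    Illustrative sketch with assumed data: tutorials tagged "training,MoE"
+    and "training" yield a training group with two items and an MoE group
+    with one.
+  {% endcomment %}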
+
+
+ {% for tutorial in tutorials %} + {% assign post = tutorial %} +
+

+ {%- unless tutorial.hidden -%} + {% include archive-single.html %} + {% if tutorial.image %} + + {% endif %} + {%- endunless -%} +

+
+ {% endfor %} +
diff --git a/docs/_sass/button-group.scss b/docs/_sass/button-group.scss
index c3eb17fe70da..ced944f51db0 100644
--- a/docs/_sass/button-group.scss
+++ b/docs/_sass/button-group.scss
@@ -19,10 +19,10 @@
   cursor: pointer;
   display: inline-block;
   font-family: system-ui,-apple-system,system-ui,"Segoe UI",Roboto,Ubuntu,"Helvetica Neue",sans-serif;
-  font-size: 18px;
+  font-size: 16px;
   font-weight: 600;
   outline: 0;
-  padding: 16px 21px;
+  padding: 16px 16px;
   position: relative;
   text-align: center;
   text-decoration: none;
diff --git a/docs/_tutorials/MoQ-tutorial.md b/docs/_tutorials/MoQ-tutorial.md
index d2abb3f11619..8776ee6f3775 100644
--- a/docs/_tutorials/MoQ-tutorial.md
+++ b/docs/_tutorials/MoQ-tutorial.md
@@ -1,5 +1,6 @@
 ---
 title: "DeepSpeed Mixture-of-Quantization (MoQ)"
+tags: training quantization
 ---

 DeepSpeed introduces new support for model compression using quantization, called Mixture-of-Quantization (MoQ). MoQ is designed on top of QAT (Quantization-Aware Training), with the difference that it schedules various data precisions across the training process. It starts by quantizing the model with a high precision, such as FP16 or 16-bit quantization, and reduces the precision through a pre-defined schedule until reaching the target quantization bits (like 8-bit). Moreover, we use second-order information of the model parameters to dynamically adjust the quantization schedule for each layer of the network separately. We have seen that by adding such a schedule and using various data precisions in the training process, we can quantize the model with better quality and preserve accuracy. For a better understanding of the MoQ methodology, please refer to the MoQ deep-dive [here](https://www.deepspeed.ai/posts/2021-05-05-MoQ/).
diff --git a/docs/_tutorials/advanced-install.md b/docs/_tutorials/advanced-install.md
index e8242c734341..fe950d0ff5f1 100755
--- a/docs/_tutorials/advanced-install.md
+++ b/docs/_tutorials/advanced-install.md
@@ -1,6 +1,7 @@
 ---
 title: "Installation Details"
 date: 2020-10-28
+tags: getting-started
 ---

 The quickest way to get started with DeepSpeed is via pip; this will install
diff --git a/docs/_tutorials/autotuning.md b/docs/_tutorials/autotuning.md
index 1354a7571396..303087d298a7 100644
--- a/docs/_tutorials/autotuning.md
+++ b/docs/_tutorials/autotuning.md
@@ -1,6 +1,7 @@
 ---
 title: "Autotuning"
 excerpt: "Automatically discover the optimal DeepSpeed configuration that delivers good training speed"
+tags: training performance-tuning
 ---

 Make sure you've read the DeepSpeed tutorials on [Getting Started](https://www.deepspeed.ai/getting-started/) and [Zero Redundancy Optimizer](https://www.deepspeed.ai/tutorials/zero/) before stepping through this tutorial.
diff --git a/docs/_tutorials/azure.md b/docs/_tutorials/azure.md
index ee6962b3ba99..1016aeafd007 100644
--- a/docs/_tutorials/azure.md
+++ b/docs/_tutorials/azure.md
@@ -1,5 +1,6 @@
 ---
 title: "Getting Started with DeepSpeed on Azure"
+tags: getting-started
 ---

 This tutorial will help you get started running DeepSpeed on [Azure virtual
diff --git a/docs/_tutorials/bert-finetuning.md b/docs/_tutorials/bert-finetuning.md
index 24e4fa167ddc..f7ea8226022e 100755
--- a/docs/_tutorials/bert-finetuning.md
+++ b/docs/_tutorials/bert-finetuning.md
@@ -1,6 +1,7 @@
 ---
 title: "BingBertSQuAD Fine-tuning"
 excerpt: ""
+tags: training fine-tuning
 ---

 In this tutorial we will be adding DeepSpeed to the BingBert model for the SQuAD fine-tuning task, called "BingBertSquad" henceforth. We will also demonstrate performance gains.
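A minimal sketch of the integration pattern this tutorial walks through (the surrounding variables `args`, `model`, and `batch`, and the JSON config referenced by `args.deepspeed_config`, are assumed to come from the existing fine-tuning script):

```python
import deepspeed

# Wrap the existing PyTorch model; batch size, fp16 and ZeRO settings
# live in the JSON config referenced by args.deepspeed_config.
model_engine, optimizer, _, _ = deepspeed.initialize(
    args=args,
    model=model,
    model_parameters=model.parameters(),
)

loss = model_engine(batch)   # forward pass as before (model-specific)
model_engine.backward(loss)  # replaces loss.backward()
model_engine.step()          # replaces optimizer.step()
```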
diff --git a/docs/_tutorials/bert-pretraining.md b/docs/_tutorials/bert-pretraining.md index 0791fb3308fe..e3771b7fdad2 100755 --- a/docs/_tutorials/bert-pretraining.md +++ b/docs/_tutorials/bert-pretraining.md @@ -1,6 +1,7 @@ --- title: "BERT Pre-training" excerpt: "" +tags: training pre-training --- In this tutorial we will apply DeepSpeed to pre-train the BERT diff --git a/docs/_tutorials/cifar-10.md b/docs/_tutorials/cifar-10.md index c7b53e58357a..11a05a78a749 100644 --- a/docs/_tutorials/cifar-10.md +++ b/docs/_tutorials/cifar-10.md @@ -1,6 +1,7 @@ --- title: "CIFAR-10 Tutorial" excerpt: "Train your first model with DeepSpeed!" +tags: getting-started --- If you haven't already, we advise you to first read through the diff --git a/docs/_tutorials/curriculum-learning.md b/docs/_tutorials/curriculum-learning.md index 577ec5c66031..938955ab57cc 100644 --- a/docs/_tutorials/curriculum-learning.md +++ b/docs/_tutorials/curriculum-learning.md @@ -1,5 +1,6 @@ --- title: "Curriculum Learning: A Regularization Method for Efficient and Stable Billion-Scale GPT Model Pre-Training" +tags: training pre-training --- **Note:** diff --git a/docs/_tutorials/flops-profiler.md b/docs/_tutorials/flops-profiler.md index 504ee9222fd1..b90a55efcada 100644 --- a/docs/_tutorials/flops-profiler.md +++ b/docs/_tutorials/flops-profiler.md @@ -1,6 +1,7 @@ --- title: "Flops Profiler" excerpt: "Measure the parameters, latency, and floating-point operations of your model" +tags: profiling performance-tuning --- In this tutorial, we introduce the DeepSpeed Flops Profiler and provide examples of its usage. diff --git a/docs/_tutorials/gan.md b/docs/_tutorials/gan.md index d880f48db28e..1389c91617dd 100755 --- a/docs/_tutorials/gan.md +++ b/docs/_tutorials/gan.md @@ -1,6 +1,7 @@ --- title: "DCGAN Tutorial" excerpt: "Train your first GAN model with DeepSpeed!" +tags: getting-started training --- If you haven't already, we advise you to first read through the [Getting Started](/getting-started/) guide before stepping through this diff --git a/docs/_tutorials/getting-started.md b/docs/_tutorials/getting-started.md index 1e45babd569b..fe765d2713b9 100644 --- a/docs/_tutorials/getting-started.md +++ b/docs/_tutorials/getting-started.md @@ -2,7 +2,7 @@ title: 'Getting Started' permalink: /getting-started/ excerpt: 'First steps with DeepSpeed' -date: 2020-05-15 +tags: getting-started --- ## Installation diff --git a/docs/_tutorials/inference-tutorial.md b/docs/_tutorials/inference-tutorial.md index 43aa45dd8bf7..253bb7092467 100644 --- a/docs/_tutorials/inference-tutorial.md +++ b/docs/_tutorials/inference-tutorial.md @@ -1,5 +1,6 @@ --- title: "Getting Started with DeepSpeed for Inferencing Transformer based Models" +tags: inference --- DeepSpeed-Inference introduces several features to efficiently serve transformer-based PyTorch models. It supports model parallelism (MP) to fit large models that would otherwise not fit in GPU memory. Even for smaller models, MP can be used to reduce latency for inference. To further reduce latency and cost, we introduce inference-customized kernels. Finally, we propose a novel approach to quantize models, called MoQ, to both shrink the model and reduce the inference cost at production. For more details on the inference related optimizations in DeepSpeed, please refer to our [blog post](https://www.microsoft.com/en-us/research/blog/deepspeed-accelerating-large-scale-model-inference-and-training-via-system-optimizations-and-compression/). 
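A minimal sketch of serving a model through these optimizations (the model choice is a placeholder, and the exact keyword set of `init_inference` at this version is an assumption to verify against the tutorial):

```python
import torch
import deepspeed
from transformers import AutoModelForCausalLM, AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("gpt2")     # placeholder model
model = AutoModelForCausalLM.from_pretrained("gpt2")

# mp_size > 1 splits the model across GPUs; replace_method="auto" swaps in
# DeepSpeed's inference-customized transformer kernels. Assumes a CUDA device.
ds_engine = deepspeed.init_inference(
    model,
    mp_size=1,
    dtype=torch.half,
    replace_method="auto",
)

inputs = tokenizer("DeepSpeed is", return_tensors="pt").input_ids.cuda()
print(tokenizer.decode(ds_engine.module.generate(inputs, max_length=20)[0]))
```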
diff --git a/docs/_tutorials/large-models-w-deepspeed.md b/docs/_tutorials/large-models-w-deepspeed.md index a7a3d66579c1..177199304a5c 100644 --- a/docs/_tutorials/large-models-w-deepspeed.md +++ b/docs/_tutorials/large-models-w-deepspeed.md @@ -1,5 +1,6 @@ --- title: "Training your large model with DeepSpeed" +tags: training --- ## Overview diff --git a/docs/_tutorials/lrrt.md b/docs/_tutorials/lrrt.md index d2e1e4051934..1659ab5bbd4d 100644 --- a/docs/_tutorials/lrrt.md +++ b/docs/_tutorials/lrrt.md @@ -1,5 +1,6 @@ --- title: "Learning Rate Range Test" +tags: training learning-rate --- This tutorial shows how to perform Learning Rate range tests in PyTorch. diff --git a/docs/_tutorials/megatron.md b/docs/_tutorials/megatron.md index 4d9846c0e329..7d81ecdcd28d 100644 --- a/docs/_tutorials/megatron.md +++ b/docs/_tutorials/megatron.md @@ -1,5 +1,6 @@ --- title: "Megatron-LM GPT2" +tags: training --- If you haven't already, we advise you to first read through the [Getting diff --git a/docs/_tutorials/mixture-of-experts-inference.md b/docs/_tutorials/mixture-of-experts-inference.md index 7a170eddd113..42df78dd0cfc 100644 --- a/docs/_tutorials/mixture-of-experts-inference.md +++ b/docs/_tutorials/mixture-of-experts-inference.md @@ -1,5 +1,6 @@ --- title: "Getting Started with DeepSpeed-MoE for Inferencing Large-Scale MoE Models" +tags: MoE inference --- DeepSpeed-MoE Inference introduces several important features on top of the inference optimizations for dense models ([DeepSpeed-Inference blog post](https://www.microsoft.com/en-us/research/blog/deepspeed-accelerating-large-scale-model-inference-and-training-via-system-optimizations-and-compression/)). It embraces several different types of parallelism, i.e. data-parallelism and tensor-slicing for the non-expert parameters, and expert-parallelism and expert-slicing for the expert parameters. To maximize the aggregate memory bandwidth, we provide communication scheduling with parallelism coordination to effectively group and route tokens with the same critical data path. Moreover, we propose new modeling optimizations, PR-MoE and MoS, to reduce MoE model size while maintaining accuracy. For more information on the DeepSpeed MoE inference optimizations, please refer to our [blog post]({{ site.press_release_v6 }}). diff --git a/docs/_tutorials/mixture-of-experts-nlg.md b/docs/_tutorials/mixture-of-experts-nlg.md index f384ab645660..e9239a7156a2 100644 --- a/docs/_tutorials/mixture-of-experts-nlg.md +++ b/docs/_tutorials/mixture-of-experts-nlg.md @@ -1,5 +1,6 @@ --- title: "Mixture of Experts for NLG models" +tags: MoE training --- In this tutorial, we introduce how to apply DeepSpeed Mixture of Experts (MoE) to NLG models, which reduces the training cost by 5 times and reduces the MoE model size by 3 times (details in our [Blog]({{ site.press_release_v6 }})). We use GPT-3-like models in the Megatron-LM framework as the example. Before reading this tutorial, we recommend first reading the tutorials on [Mixture of Experts](/tutorials/mixture-of-experts/) and [Megatron-LM GPT pre-training](/tutorials/megatron/). diff --git a/docs/_tutorials/mixture-of-experts.md b/docs/_tutorials/mixture-of-experts.md index 8485f1547c6a..23d807ab3eb1 100644 --- a/docs/_tutorials/mixture-of-experts.md +++ b/docs/_tutorials/mixture-of-experts.md @@ -1,5 +1,6 @@ --- title: "Mixture of Experts" +tags: MoE training --- DeepSpeed v0.5 introduces new support for training Mixture of Experts (MoE) models.
MoE models are an emerging class of sparsely activated models that have sublinear compute costs with respect to their parameters. For example, the [Switch Transformer](https://arxiv.org/abs/2101.03961) consists of over 1.6 trillion parameters, while the compute required to train it is approximately equal to that of a 10-billion-parameter dense model. This increase in model size offers tremendous accuracy gains for a constant compute budget. diff --git a/docs/_tutorials/one-cycle.md b/docs/_tutorials/one-cycle.md index 560f637b4763..12967ad56ad5 100644 --- a/docs/_tutorials/one-cycle.md +++ b/docs/_tutorials/one-cycle.md @@ -1,5 +1,6 @@ --- title: "1-Cycle Schedule" +tags: training learning-rate --- This tutorial shows how to implement 1Cycle schedules for learning rate and diff --git a/docs/_tutorials/onebit-adam.md b/docs/_tutorials/onebit-adam.md index df3a7ba926c9..20df2b99d9fb 100644 --- a/docs/_tutorials/onebit-adam.md +++ b/docs/_tutorials/onebit-adam.md @@ -1,5 +1,6 @@ --- title: "1-bit Adam: Up to 5x less communication volume and up to 3.4x faster training" +tags: training IO --- **Note:** diff --git a/docs/_tutorials/onebit-lamb.md b/docs/_tutorials/onebit-lamb.md index f6d9341d9095..822f79e61740 100644 --- a/docs/_tutorials/onebit-lamb.md +++ b/docs/_tutorials/onebit-lamb.md @@ -1,5 +1,6 @@ --- title: "1-bit LAMB: Communication Efficient Large-Scale Large-Batch Training with LAMB's Convergence Speed" +tags: training IO --- **Watch out!** diff --git a/docs/_tutorials/pipeline.md b/docs/_tutorials/pipeline.md index 1751846830ef..4454de00038f 100644 --- a/docs/_tutorials/pipeline.md +++ b/docs/_tutorials/pipeline.md @@ -1,5 +1,6 @@ --- title: "Pipeline Parallelism" +tags: training --- DeepSpeed v0.3 includes new support for pipeline parallelism! Pipeline diff --git a/docs/_tutorials/progressive_layer_dropping.md b/docs/_tutorials/progressive_layer_dropping.md index 8c184dfc6d21..b7b868bf29d3 100755 --- a/docs/_tutorials/progressive_layer_dropping.md +++ b/docs/_tutorials/progressive_layer_dropping.md @@ -1,6 +1,6 @@ --- title: "Accelerating Training of Transformer-Based Language Models with Progressive Layer Dropping" - +tags: training --- In this tutorial, we introduce progressive layer dropping (PLD) in DeepSpeed and provide examples of how to use it. PLD allows Transformer networks such as BERT to be trained 24% faster with the same number of samples, and 2.5 times faster to reach similar accuracy on downstream tasks. A detailed description of PLD and the experimental results are available in our [technical report](https://arxiv.org/pdf/2010.13369.pdf). diff --git a/docs/_tutorials/pytorch-profiler.md b/docs/_tutorials/pytorch-profiler.md index 7389f9b1e61f..a9a9f58d6e32 100644 --- a/docs/_tutorials/pytorch-profiler.md +++ b/docs/_tutorials/pytorch-profiler.md @@ -1,5 +1,6 @@ --- title: "Using PyTorch Profiler with DeepSpeed for performance debugging" +tags: profiling performance-tuning --- This tutorial describes how to use [PyTorch Profiler](https://pytorch.org/blog/introducing-pytorch-profiler-the-new-and-improved-performance-tool/) with DeepSpeed. diff --git a/docs/_tutorials/sparse-attention.md b/docs/_tutorials/sparse-attention.md index 8905b38debbc..bad6bf627d90 100644 --- a/docs/_tutorials/sparse-attention.md +++ b/docs/_tutorials/sparse-attention.md @@ -1,5 +1,6 @@ --- title: "DeepSpeed Sparse Attention" +tags: training --- In this tutorial we describe how to use DeepSpeed Sparse Attention (SA) and its building-block kernels.
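Concretely, SA is enabled through a `sparse_attention` block in the DeepSpeed config. The snippet below mirrors the fixed-mode example from this tutorial as best we recall it; treat the field names as an illustration to be checked against the tutorial itself, not an authoritative schema:

```python
# Illustrative "fixed" sparsity pattern for DeepSpeed Sparse Attention.
# Field names are assumptions based on the SA tutorial; verify before use.
ds_config = {
    "sparse_attention": {
        "mode": "fixed",               # fixed local/global block pattern
        "block": 16,                   # block size of the block-sparse layout
        "different_layout_per_head": True,
        "num_local_blocks": 4,         # blocks in each local attention window
        "num_global_blocks": 1,        # blocks promoted to global attention
        "attention": "bidirectional",  # BERT-style; "unidirectional" for GPT-style
        "horizontal_global_attention": False,
        "num_different_global_patterns": 4,
    }
}
```

Passing a config like this through the launcher is exactly the path the next paragraph describes.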
The easiest way to use SA is through the DeepSpeed launcher. We will describe this through an example in the [How to use sparse attention with DeepSpeed launcher](#how-to-use-sparse-attention-with-deepspeed-launcher) section. Before that, we introduce the modules provided by DeepSpeed SA in the [next](#sparse-attention-modules) section. diff --git a/docs/_tutorials/transformer_kernel.md b/docs/_tutorials/transformer_kernel.md index 9dbcf26e2a12..915117fc3af9 100755 --- a/docs/_tutorials/transformer_kernel.md +++ b/docs/_tutorials/transformer_kernel.md @@ -1,5 +1,6 @@ --- -title: "DeepSpeed Transformer Kernel" +title: "DeepSpeed Transformer Kernel" +tags: training --- This tutorial shows how to enable the DeepSpeed transformer kernel and set its different configuration parameters. diff --git a/docs/_tutorials/zero-offload.md b/docs/_tutorials/zero-offload.md index a1b05451f96d..7102f0667477 100644 --- a/docs/_tutorials/zero-offload.md +++ b/docs/_tutorials/zero-offload.md @@ -1,5 +1,6 @@ --- title: "ZeRO-Offload" +tags: training IO --- ZeRO-3 Offload consists of a subset of features in our newly released ZeRO-Infinity. Read our [ZeRO-Infinity blog](https://www.microsoft.com/en-us/research/blog/zero-infinity-and-deepspeed-unlocking-unprecedented-model-scale-for-deep-learning-training/) to learn more! diff --git a/docs/_tutorials/zero.md b/docs/_tutorials/zero.md index 7721f45ece4f..9f858a067162 100644 --- a/docs/_tutorials/zero.md +++ b/docs/_tutorials/zero.md @@ -1,5 +1,6 @@ --- title: "Zero Redundancy Optimizer (ZeRO)" +tags: training --- If you have not done so already, we advise that you read the DeepSpeed tutorials on [Getting Started](/getting-started/) and [Megatron-LM GPT-2](/tutorials/megatron/) before stepping through this tutorial. diff --git a/docs/tags.md b/docs/tags.md index 035f6cfe153d..fb704ffaa808 100644 --- a/docs/tags.md +++ b/docs/tags.md @@ -11,11 +11,10 @@ permalink: /posts/
+<ul class="tag-box inline">
+  {% assign tags = site.tags | sort %}
+  {% for category in tags %}
+  {% assign cat = category | first %}
+  <li><a href="#{{ cat }}">{{ cat }} <span class="size">{{ site.tags[cat].size }}</span></a></li>
+  {% endfor %}
+</ul>
+
+{% for post in posts %}
+  {%- unless post.hidden -%}
+  {% include archive-single.html %}
+  {% if post.image %}
+  <img src="{{ post.image }}" alt="">
+  {% endif %}
+  {%- endunless -%}
+{% endfor %}
diff --git a/docs/_pages/posts_list_landing.md b/docs/_pages/posts_list_landing.md new file mode 100644 index 000000000000..207d48a259f2 --- /dev/null +++ b/docs/_pages/posts_list_landing.md @@ -0,0 +1,36 @@
+---
+layout: archive
+permalink: /posts-list/
+---
+
+{% assign sorted_tags = (site.tags | sort:0) %}
+<ul>
+  {% for tag in sorted_tags %}
+  {% assign t = tag | first %}
+  {% assign ps = tag | last %}
+  <li><a href="#{{ t }}">{{ t }} ({{ ps.size }})</a></li>
+  {% endfor %}
+</ul>
+
+{% for tag in sorted_tags %}
+  {% assign t = tag | first %}
+  {% assign posts = tag | last %}
+  <h2 id="{{ t }}">{{ t }}</h2>
+  <ul>
+    {% for post in posts %}
+    {% if post.tags contains t %}
+    {% if post.link %}
+    <li>{{ post.date | date: '%d %b %y' }}: <a href="{{ post.link }}">{{ post.title }}</a></li>
+    {% else %}
+    <li>{{ post.date | date: '%d %b %y' }}: <a href="{{ post.url }}">{{ post.title }}</a></li>
+    {% endif %}
+    {% endif %}
+    {% endfor %}
+  </ul>
+{% endfor %} diff --git a/docs/_sass/minimal-mistakes/_page.scss b/docs/_sass/minimal-mistakes/_page.scss new file mode 100644 index 000000000000..06fef675dbb5 --- /dev/null +++ b/docs/_sass/minimal-mistakes/_page.scss @@ -0,0 +1,560 @@ +/* ========================================================================== + SINGLE PAGE/POST + ========================================================================== */ + +#main { + @include clearfix; + margin-left: auto; + margin-right: auto; + padding-left: 1em; + padding-right: 1em; + -webkit-animation: $intro-transition; + animation: $intro-transition; + max-width: 100%; + -webkit-animation-delay: 0.15s; + animation-delay: 0.15s; + + @include breakpoint($x-large) { + max-width: $max-width; + } +} + +body { + display: -webkit-box; + display: -ms-flexbox; + display: flex; + min-height: 100vh; + -webkit-box-orient: vertical; + -webkit-box-direction: normal; + -ms-flex-direction: column; + flex-direction: column; +} + +.initial-content, +.search-content { + flex: 1 0 auto; +} + +.page { + @include breakpoint($large) { + float: right; + width: calc(100% - #{$right-sidebar-width-narrow}); + padding-right: $right-sidebar-width-narrow; + } + + @include breakpoint($x-large) { + width: calc(100% - #{$right-sidebar-width}); + padding-right: $right-sidebar-width; + } + + .page__inner-wrap { + float: left; + margin-top: 1em; + margin-left: 0; + margin-right: 0; + width: 100%; + clear: both; + + .page__content, + .page__meta, + .page__share { + position: relative; + float: left; + margin-left: 0; + margin-right: 0; + width: 100%; + clear: both; + } + } +} + +.page__title { + margin-top: 0; + line-height: 1.5; + + & + .page__meta { + margin-top: -0.5em; + } +} + +.page__lead { + font-family: $global-font-family; + font-size: $type-size-4; +} + +.page__content { + h2 { + padding-bottom: 0.5em; + border-bottom: 1px solid $border-color; + } + + h1, h2, h3, h4, h5, h6 { + .header-link { + position: relative; + left: 0.5em; + opacity: 0; + font-size: 0.8em; + -webkit-transition: opacity 0.2s ease-in-out 0.1s; + -moz-transition: opacity 0.2s ease-in-out 0.1s; + -o-transition: opacity 0.2s ease-in-out 0.1s; + transition: opacity 0.2s ease-in-out 0.1s; + } + + &:hover .header-link { + opacity: 1; + } + } + + p, + li, + dl { + font-size: 1em; + line-height: 1.7777778; + } + + /* paragraph indents */ + p { + margin: 0 0 $indent-var; + + /* sibling indentation*/ + @if $paragraph-indent == true { + & + p { + text-indent: $indent-var; + margin-top: -($indent-var); + } + } + } + + a:not(.btn) { + &:hover { + text-decoration: underline; + + img { + box-shadow: 0 0 10px rgba(#000, 0.25); + } + } + } + + dt { + margin-top: 1em; + font-family: $sans-serif; + font-weight: bold; + } + + dd { + margin-left: 1em; + font-family: $sans-serif; + font-size: $type-size-6; + } + + .small { + font-size: $type-size-6; + } + + /* blockquote citations */ + blockquote + .small { + margin-top: -1.5em; + padding-left: 1.25rem; + } +} + +.page__hero { + position: relative; + margin-bottom: 2em; + @include clearfix; + -webkit-animation: $intro-transition; + animation: $intro-transition; + -webkit-animation-delay: 0.25s; + animation-delay: 0.25s; + + &--overlay { + position: relative; + margin-bottom: 2em; + padding: 3em 0; + @include clearfix; + background-size: cover; + background-repeat: no-repeat; + background-position: center; + -webkit-animation: $intro-transition; + animation: $intro-transition; + -webkit-animation-delay: 0.25s; + animation-delay: 0.25s; + + a { + color: #fff; + } + + 
.wrapper { + padding-left: 1em; + padding-right: 1em; + + @include breakpoint($x-large) { + max-width: $x-large; + } + } + + .page__title, + .page__meta, + .page__lead, + .btn { + color: #fff; + text-shadow: 1px 1px 4px rgba(#000, 0.5); + } + + .page__lead { + max-width: $medium; + } + + .page__title { + font-size: $type-size-2; + + @include breakpoint($small) { + font-size: $type-size-1; + } + } + } +} + +.page__hero-image { + width: 100%; + height: auto; + -ms-interpolation-mode: bicubic; +} + +.page__hero-caption { + position: absolute; + bottom: 0; + right: 0; + margin: 0 auto; + padding: 2px 5px; + color: #fff; + font-family: $caption-font-family; + font-size: $type-size-7; + background: #000; + text-align: right; + z-index: 5; + opacity: 0.5; + border-radius: $border-radius 0 0 0; + + @include breakpoint($large) { + padding: 5px 10px; + } + + a { + color: #fff; + text-decoration: none; + } +} + +/* + Social sharing + ========================================================================== */ + +.page__share { + margin-top: 2em; + padding-top: 1em; + border-top: 1px solid $border-color; + + @include breakpoint(max-width $small) { + .btn span { + border: 0; + clip: rect(0 0 0 0); + height: 1px; + margin: -1px; + overflow: hidden; + padding: 0; + position: absolute; + width: 1px; + } + } +} + +.page__share-title { + margin-bottom: 10px; + font-size: $type-size-6; + text-transform: uppercase; +} + +/* + Page meta + ========================================================================== */ + +.page__meta { + margin-top: 2em; + color: $muted-text-color; + font-family: $sans-serif; + font-size: $type-size-6; + + p { + margin: 0; + } + + a { + color: inherit; + } +} + +.page__meta-title { + margin-bottom: 10px; + font-size: $type-size-6; + text-transform: uppercase; +} + +.page__meta-sep::before { + content: "\2022"; + padding-left: 0.5em; + padding-right: 0.5em; +} + +/* + Page taxonomy + ========================================================================== */ + +.page__taxonomy { + .sep { + display: none; + } + + strong { + margin-right: 10px; + } +} + +.page__taxonomy-item { + display: inline-block; + margin-right: 5px; + margin-bottom: 8px; + padding: 5px 10px; + text-decoration: none; + border: 1px solid mix(#000, $border-color, 25%); + border-radius: $border-radius; + + &:hover { + text-decoration: none; + color: $link-color-hover; + } +} + +.taxonomy__section { + margin-bottom: 2em; + padding-bottom: 1em; + + &:not(:last-child) { + border-bottom: solid 1px $border-color; + } + + .archive__item-title { + margin-top: 0; + } + + .archive__subtitle { + clear: both; + border: 0; + } + + + .taxonomy__section { + margin-top: 2em; + } +} + +.taxonomy__title { + margin-bottom: 0.5em; + color: $muted-text-color; +} + +.taxonomy__count { + color: $muted-text-color; +} + +.taxonomy__index { + display: grid; + grid-column-gap: 2em; + grid-template-columns: repeat(2, 1fr); + margin: 1.414em 0; + padding: 0; + font-size: 0.75em; + list-style: none; + + @include breakpoint($large) { + grid-template-columns: repeat(3, 1fr); + } + + a { + display: -webkit-box; + display: -ms-flexbox; + display: flex; + padding: 0.25em 0; + -webkit-box-pack: justify; + -ms-flex-pack: justify; + justify-content: space-between; + color: inherit; + text-decoration: none; + border-bottom: 1px solid $border-color; + } +} + +.back-to-top { + display: block; + clear: both; + color: $muted-text-color; + font-size: 0.6em; + text-transform: uppercase; + text-align: right; + text-decoration: none; +} + +/* + Comments + 
========================================================================== */ + +.page__comments { + float: left; + margin-left: 0; + margin-right: 0; + width: 100%; + clear: both; +} + +.page__comments-title { + margin-top: 2rem; + margin-bottom: 10px; + padding-top: 2rem; + font-size: $type-size-6; + border-top: 1px solid $border-color; + text-transform: uppercase; +} + +.page__comments-form { + -webkit-transition: $global-transition; + transition: $global-transition; + + &.disabled { + input, + button, + textarea, + label { + pointer-events: none; + cursor: not-allowed; + filter: alpha(opacity=65); + box-shadow: none; + opacity: 0.65; + } + } +} + +.comment { + @include clearfix(); + margin: 1em 0; + + &:not(:last-child) { + border-bottom: 1px solid $border-color; + } +} + +.comment__avatar-wrapper { + float: left; + width: 60px; + height: 60px; + + @include breakpoint($large) { + width: 100px; + height: 100px; + } +} + +.comment__avatar { + width: 40px; + height: 40px; + border-radius: 50%; + + @include breakpoint($large) { + width: 80px; + height: 80px; + padding: 5px; + border: 1px solid $border-color; + } +} + +.comment__content-wrapper { + float: right; + width: calc(100% - 60px); + + @include breakpoint($large) { + width: calc(100% - 100px); + } +} + +.comment__author { + margin: 0; + + a { + text-decoration: none; + } +} + +.comment__date { + @extend .page__meta; + margin: 0; + + a { + text-decoration: none; + } +} + +/* + Related + ========================================================================== */ + +.page__related { + @include clearfix(); + float: left; + margin-top: 2em; + padding-top: 1em; + border-top: 1px solid $border-color; + + @include breakpoint($large) { + float: right; + width: calc(100% - #{$right-sidebar-width-narrow}); + } + + @include breakpoint($x-large) { + width: calc(100% - #{$right-sidebar-width}); + } + + a { + color: inherit; + text-decoration: none; + } +} + +.page__related-title { + margin-bottom: 10px; + font-size: $type-size-6; + text-transform: uppercase; +} + +/* + Wide Pages + ========================================================================== */ + +.wide { + .page { + @include breakpoint($large) { + padding-right: 0; + } + + @include breakpoint($x-large) { + padding-right: 0; + } + } + + .page__related { + @include breakpoint($large) { + padding-right: 0; + } + + @include breakpoint($x-large) { + padding-right: 0; + } + } +} diff --git a/docs/_sass/minimal-mistakes/_variables.scss b/docs/_sass/minimal-mistakes/_variables.scss new file mode 100644 index 000000000000..f7143ca81364 --- /dev/null +++ b/docs/_sass/minimal-mistakes/_variables.scss @@ -0,0 +1,169 @@ +/* ========================================================================== + Variables + ========================================================================== */ + +/* + Typography + ========================================================================== */ + +$doc-font-size: 12 !default; + +/* paragraph indention */ +$paragraph-indent: false !default; // true, false (default) +$indent-var: 1.3em !default; + +/* system typefaces */ +$serif: Georgia, Times, serif !default; +$sans-serif: -apple-system, BlinkMacSystemFont, "Roboto", "Segoe UI", + "Helvetica Neue", "Lucida Grande", Arial, sans-serif !default; +$monospace: Monaco, Consolas, "Lucida Console", monospace !default; + +/* sans serif typefaces */ +$sans-serif-narrow: $sans-serif !default; +$helvetica: Helvetica, "Helvetica Neue", Arial, sans-serif !default; + +/* serif typefaces */ +$georgia: Georgia, serif 
!default; +$times: Times, serif !default; +$bodoni: "Bodoni MT", serif !default; +$calisto: "Calisto MT", serif !default; +$garamond: Garamond, serif !default; + +$global-font-family: $sans-serif !default; +$header-font-family: $sans-serif !default; +$caption-font-family: $serif !default; + +/* type scale */ +$type-size-1: 2.441em !default; // ~39.056px +$type-size-2: 1.953em !default; // ~31.248px +$type-size-3: 1.563em !default; // ~25.008px +$type-size-4: 1.25em !default; // ~20px +$type-size-5: 1em !default; // ~16px +$type-size-6: 0.75em !default; // ~12px +$type-size-7: 0.6875em !default; // ~11px +$type-size-8: 0.625em !default; // ~10px + +/* headline scale */ +$h-size-1: 1.563em !default; // ~25.008px +$h-size-2: 1.25em !default; // ~20px +$h-size-3: 1.125em !default; // ~18px +$h-size-4: 1.0625em !default; // ~17px +$h-size-5: 1.03125em !default; // ~16.5px +$h-size-6: 1em !default; // ~16px + +/* + Colors + ========================================================================== */ + +$gray: #7a8288 !default; +$dark-gray: mix(#000, $gray, 50%) !default; +$darker-gray: mix(#000, $gray, 60%) !default; +$light-gray: mix(#fff, $gray, 50%) !default; +$lighter-gray: mix(#fff, $gray, 90%) !default; + +$background-color: #fff !default; +$code-background-color: #fafafa !default; +$code-background-color-dark: $light-gray !default; +$text-color: $dark-gray !default; +$muted-text-color: mix(#fff, $text-color, 20%) !default; +$border-color: $lighter-gray !default; +$form-background-color: $lighter-gray !default; +$footer-background-color: $lighter-gray !default; + +$primary-color: #6f777d !default; +$success-color: #3fa63f !default; +$warning-color: #d67f05 !default; +$danger-color: #ee5f5b !default; +$info-color: #3b9cba !default; +$focus-color: $primary-color !default; +$active-color: mix(#fff, $primary-color, 80%) !default; + +/* YIQ color contrast */ +$yiq-contrasted-dark-default: $dark-gray !default; +$yiq-contrasted-light-default: #fff !default; +$yiq-contrasted-threshold: 175 !default; +$yiq-debug: false !default; + +/* brands */ +$behance-color: #1769ff !default; +$bitbucket-color: #205081 !default; +$dribbble-color: #ea4c89 !default; +$facebook-color: #3b5998 !default; +$flickr-color: #ff0084 !default; +$foursquare-color: #0072b1 !default; +$github-color: #171516 !default; +$gitlab-color: #e24329 !default; +$instagram-color: #517fa4 !default; +$keybase-color: #ef7639 !default; +$lastfm-color: #d51007 !default; +$linkedin-color: #007bb6 !default; +$mastodon-color: #2b90d9 !default; +$pinterest-color: #cb2027 !default; +$reddit-color: #ff4500 !default; +$rss-color: #fa9b39 !default; +$soundcloud-color: #ff3300 !default; +$stackoverflow-color: #fe7a15 !default; +$tumblr-color: #32506d !default; +$twitter-color: #55acee !default; +$vimeo-color: #1ab7ea !default; +$vine-color: #00bf8f !default; +$youtube-color: #bb0000 !default; +$xing-color: #006567 !default; + +/* links */ +$link-color: mix(#000, $info-color, 20%) !default; +$link-color-hover: mix(#000, $link-color, 25%) !default; +$link-color-visited: mix(#fff, $link-color, 15%) !default; +$masthead-link-color: $primary-color !default; +$masthead-link-color-hover: mix(#000, $primary-color, 25%) !default; +$navicon-link-color-hover: mix(#fff, $primary-color, 75%) !default; + +/* syntax highlighting (base16) */ +$base00: #263238 !default; +$base01: #2e3c43 !default; +$base02: #314549 !default; +$base03: #546e7a !default; +$base04: #b2ccd6 !default; +$base05: #eeffff !default; +$base06: #eeffff !default; +$base07: #ffffff !default; 
+$base08: #f07178 !default; +$base09: #f78c6c !default; +$base0a: #ffcb6b !default; +$base0b: #c3e88d !default; +$base0c: #89ddff !default; +$base0d: #82aaff !default; +$base0e: #c792ea !default; +$base0f: #ff5370 !default; + +/* + Breakpoints + ========================================================================== */ + +$small: 600px !default; +$medium: 768px !default; +$medium-wide: 900px !default; +$large: 1024px !default; +$x-large: 1280px !default; +$max-width: $x-large !default; + +/* + Grid + ========================================================================== */ + +$right-sidebar-width-narrow: 200px !default; +$right-sidebar-width: 300px !default; +$right-sidebar-width-wide: 400px !default; + +/* + Other + ========================================================================== */ + +$border-radius: 4px !default; +$box-shadow: 0 1px 1px rgba(0, 0, 0, 0.125) !default; +$nav-height: 2em !default; +$nav-toggle-height: 2rem !default; +$navicon-width: 1.5rem !default; +$navicon-height: 0.25rem !default; +$global-transition: all 0.2s ease-in-out !default; +$intro-transition: intro 0.3s both !default; diff --git a/docs/_sass/minimal-mistakes/skins/_air.scss b/docs/_sass/minimal-mistakes/skins/_air.scss new file mode 100644 index 000000000000..662e1451926e --- /dev/null +++ b/docs/_sass/minimal-mistakes/skins/_air.scss @@ -0,0 +1,23 @@ +/* ========================================================================== + Air skin + ========================================================================== */ + +/* Colors */ +$background-color: white !default; +$text-color: #222831 !default; +$muted-text-color: #393e46 !default; +$primary-color: #0092ca !default; +$border-color: mix(#fff, #393e46, 75%) !default; +$footer-background-color: $primary-color !default; +$link-color: #393e46 !default; +$masthead-link-color: $text-color !default; +$masthead-link-color-hover: $text-color !default; +$navicon-link-color-hover: mix(#fff, $text-color, 80%) !default; + +.page__footer { + color: #fff !important; // override +} + +.page__footer-follow .social-icons .svg-inline--fa { + color: inherit; +} diff --git a/docs/assets/css/main.scss b/docs/assets/css/main.scss index 5739da82947e..7fccdd65bd30 100644 --- a/docs/assets/css/main.scss +++ b/docs/assets/css/main.scss @@ -65,3 +65,5 @@ ul.tag-box li a { ul.tag-box li span.size { font-weight: bold; } + +.site-logo img { max-height: 200%; width: auto; } diff --git a/docs/assets/images/deepspeed-logo-uppercase-bold-white-1.15.svg b/docs/assets/images/deepspeed-logo-uppercase-bold-white-1.15.svg new file mode 100644 index 000000000000..1cb9f7575a00 --- /dev/null +++ b/docs/assets/images/deepspeed-logo-uppercase-bold-white-1.15.svg @@ -0,0 +1,24 @@ [24 lines of SVG markup not recoverable] \ No newline at end of file diff --git a/docs/assets/images/deepspeed-logo-uppercase-bold-white.svg b/docs/assets/images/deepspeed-logo-uppercase-bold-white.svg new file mode 100644 index 000000000000..32395acc8dc8 --- /dev/null +++ b/docs/assets/images/deepspeed-logo-uppercase-bold-white.svg @@ -0,0 +1,19 @@ [19 lines of SVG markup not recoverable] diff --git a/docs/assets/images/deepspeed-logo-uppercase-white.svg b/docs/assets/images/deepspeed-logo-uppercase-white.svg new file mode 100644 index 000000000000..1fc99199f8d6 --- /dev/null +++ b/docs/assets/images/deepspeed-logo-uppercase-white.svg @@ -0,0 +1,19 @@ [19 lines of SVG markup not recoverable] From 04c5f5a4c7ed253e8fb4d7b5513a04c3040ccaf9 Mon Sep 17 00:00:00 2001 From: Cheng Li Date: Wed, 2 Mar 2022 02:38:43
+0500 Subject: [PATCH 13/20] fix format --- docs/Gemfile.lock | 8 ++-- docs/_config.yml | 12 ++++- docs/_includes/masthead.html | 4 +- docs/_layouts/single-full.html | 2 +- docs/_posts/2020-02-13-release.md | 6 +-- docs/_posts/2020-05-19-bert-record.md | 4 +- docs/_posts/2020-05-19-press-release.md | 4 +- docs/_posts/2020-05-19-zero-stage2.md | 5 +- .../2020-09-08-sparse-attention-news.md | 1 + docs/_posts/2020-09-09-ZeRO-Offload.md | 5 +- ...0-10-28-progressive-layer-dropping-news.md | 1 + docs/_posts/2021-03-08-zero3-offload.md | 10 ++-- docs/_posts/2021-05-14-inference-release.md | 2 +- docs/_posts/2021-11-15-autotuning.md | 1 + docs/_posts/2021-12-09-deepspeed-moe-nlg.md | 6 +-- docs/_tutorials/zero.md | 2 + ...epspeed-logo-uppercase-bold-white-1.15.svg | 2 +- docs/index.md | 7 +-- docs/tags.md | 48 ------------------- docs/tags_list.md | 36 -------------- 20 files changed, 47 insertions(+), 119 deletions(-) delete mode 100644 docs/tags.md delete mode 100644 docs/tags_list.md diff --git a/docs/Gemfile.lock b/docs/Gemfile.lock index 657c3228370a..592d5adbced7 100644 --- a/docs/Gemfile.lock +++ b/docs/Gemfile.lock @@ -231,7 +231,7 @@ GEM jekyll (>= 3.5, < 5.0) jekyll-feed (~> 0.9) jekyll-seo-tag (~> 2.1) - minimal-mistakes-jekyll (4.20.2) + minimal-mistakes-jekyll (4.24.0) jekyll (>= 3.7, < 5.0) jekyll-feed (~> 0.1) jekyll-gist (~> 1.5) @@ -248,9 +248,9 @@ GEM sawyer (~> 0.8.0, >= 0.5.3) pathutil (0.16.2) forwardable-extended (~> 2.6) - public_suffix (3.1.1) + public_suffix (4.0.6) racc (1.6.0) - rb-fsevent (0.10.4) + rb-fsevent (0.11.1) rb-inotify (0.10.1) ffi (~> 1.0) rexml (3.2.5) @@ -277,7 +277,7 @@ GEM ethon (>= 0.9.0) tzinfo (1.2.9) thread_safe (~> 0.1) - tzinfo-data (1.2020.3) + tzinfo-data (1.2021.5) tzinfo (>= 1.0.0) unf (0.1.4) unf_ext diff --git a/docs/_config.yml b/docs/_config.yml index bb545716cec6..963e8734a8f2 100644 --- a/docs/_config.yml +++ b/docs/_config.yml @@ -5,6 +5,7 @@ description: >- training easy, efficient, and effective. locale : "en-US" +logo: /assets/images/deepspeed-logo-uppercase-bold-white-1.15.svg repository: microsoft/DeepSpeed baseurl: "/" # the subpath of your site, e.g. /blog @@ -80,14 +81,21 @@ defaults: type: posts values: layout: single-full - classes: wide2 + classes: wide author_profile: false read_time: false comments: false share: true related: false - toc: false + toc: true + toc_label: "Contents" show_date: true + - scope: + path: "" + type: tutorials + values: + classes: wide + layout: single analytics: provider: "google-gtag" diff --git a/docs/_includes/masthead.html b/docs/_includes/masthead.html index 47cce0a3545e..0a14c23ebde0 100644 --- a/docs/_includes/masthead.html +++ b/docs/_includes/masthead.html @@ -7,10 +7,10 @@ {% unless logo_path == empty %} {% endunless %} - +