Merge branch 'main' into jiannanWang/examples

jiannanWang · web-flow · commit 4dba7db84f95 · 2025-09-29T12:31:57.000-07:00
diff --git a/advanced_source/semi_structured_sparse.py b/advanced_source/semi_structured_sparse.py
@@ -43,6 +43,8 @@
 # -  A NVIDIA GPU with semi-structured sparsity support (Compute
 #    Capability 8.0+).
 #
+#  .. note:: This tutorial is tested on an NVIDIA A100 80GB GPU. You may not see similar speedups on newer GPU architectures. For the latest information on semi-structured sparsity support, please refer to the README `here <https://github.com/pytorch/ao/tree/main/torchao/sparsity#torchao-sparsity>`_.
+#
 # This tutorial is designed for beginners to semi-structured sparsity and
 # sparsity in general. For users with existing 2:4 sparse models,
 # accelerating ``nn.Linear`` layers for inference with
@@ -52,7 +54,6 @@
 import torch
 from torch.sparse import to_sparse_semi_structured, SparseSemiStructuredTensor
 from torch.utils.benchmark import Timer
-SparseSemiStructuredTensor._FORCE_CUTLASS = True
 
 # mask Linear weight to be 2:4 sparse
 mask = torch.Tensor([0, 0, 1, 1]).tile((3072, 2560)).cuda().bool()
@@ -207,7 +208,6 @@
 import transformers
 
 # force CUTLASS use if ``cuSPARSELt`` is not available
-SparseSemiStructuredTensor._FORCE_CUTLASS = True
 torch.manual_seed(100)
 
 # Set default device to "cuda:0"
diff --git a/redirects.py b/redirects.py
@@ -48,6 +48,7 @@
     "recipes/torchserve_vertexai_tutorial.html": "../index.html",
     "recipes/amx.html": "../index.html",
     "unstable_source/vulkan_workflow.rst": "../index.html",
+    "unstable/semi_structured_sparse.html": "https://docs.pytorch.org/tutorials/advanced/semi_structured_sparse.html",
     "unstable/skip_param_init.html": "https://docs.pytorch.org/tutorials/recipes/recipes/module_load_state_dict_tips.html",
     "unstable_source/backend_config_tutorial.rst": "../index.html",
 }
diff --git a/unstable_index.rst b/unstable_index.rst
@@ -36,15 +36,6 @@ decide if we want to upgrade the level of commitment or to fail fast.
 
 .. Add prototype tutorial cards below this line
 
-.. Sparsity
-
-.. customcarditem::
-   :header: (prototype) Accelerating BERT with semi-structured (2:4) sparsity
-   :card_description: Prune BERT to be 2:4 sparse and accelerate for inference.
-   :image: _static/img/thumbnails/cropped/generic-pytorch-logo.png
-   :link: unstable/semi_structured_sparse.html
-   :tags: Model-Optimiziation
-
 .. vmap
 
 .. customcarditem::
diff --git a/unstable_source/semi_structured_sparse.rst b/unstable_source/semi_structured_sparse.rst

Original file line number	Diff line number	Diff line change
`@@ -48,6 +48,7 @@`
`48`	`48`	`"recipes/torchserve_vertexai_tutorial.html": "../index.html",`
`49`	`49`	`"recipes/amx.html": "../index.html",`
`50`	`50`	`"unstable_source/vulkan_workflow.rst": "../index.html",`
	`51`	`+ "unstable/semi_structured_sparse.html": "https://docs.pytorch.org/tutorials/advanced/semi_structured_sparse.html",`
`51`	`52`	`"unstable/skip_param_init.html": "https://docs.pytorch.org/tutorials/recipes/recipes/module_load_state_dict_tips.html",`
`52`	`53`	`"unstable_source/backend_config_tutorial.rst": "../index.html",`
`53`	`54`	`}`