Revise sparse docs regarding Sparse Compressed tensors (#82108)

Pull Request resolved: https://github.com/pytorch/pytorch/pull/82108 Approved by: https://github.com/bhosmer
2026-05-14 20:57:59 +00:00 · 2022-07-29 17:52:37 +03:00 · 2022-07-29 17:52:37 +03:00 · ff5399e528
commit ff5399e528
parent 8def154e00
5 changed files with 625 additions and 146 deletions
--- a/aten/src/ATen/native/sparse/SparseCsrTensor.cpp
+++ b/aten/src/ATen/native/sparse/SparseCsrTensor.cpp
@ -165,15 +165,15 @@ void _validate_sparse_compressed_tensor_args_worker(const Tensor& compressed_ind
  }
  const int nrows = size[batch_ndim] / blocksize[0];
  const int ncols = size[batch_ndim + 1] / blocksize[1];
-  int ncompressed_dims, nplain_dims;
-  std::tie(ncompressed_dims, nplain_dims) = AT_DISPATCH_ROW_SPARSE_COMPRESSED_LAYOUTS(layout, "validate_sparse_compressed_tensor_args",
-                                                                                      [&] { return std::make_tuple(nrows, ncols); },
-                                                                                      [&] { return std::make_tuple(ncols, nrows); });
+  int compressed_dim_size, plain_dim_size;
+  std::tie(compressed_dim_size, plain_dim_size) = AT_DISPATCH_ROW_SPARSE_COMPRESSED_LAYOUTS(layout, "validate_sparse_compressed_tensor_args",
+                                                                                            [&] { return std::make_tuple(nrows, ncols); },
+                                                                                            [&] { return std::make_tuple(ncols, nrows); });
  // 3.8
  TORCH_CHECK(
-              compressed_indices.size(-1) == ncompressed_dims + 1,
+              compressed_indices.size(-1) == compressed_dim_size + 1,
              compressed_indices_name, ".shape[-1] must be equal to the number of ",
-              compressed_dim_name, "s + 1 (=", ncompressed_dims + 1, "), but got ", compressed_indices.size(-1));
+              compressed_dim_name, "s + 1 (=", compressed_dim_size + 1, "), but got ", compressed_indices.size(-1));
  // 3.9, 3.10
  TORCH_CHECK(
              plain_indices.size(-1) == values_nnz,
@ -198,8 +198,8 @@ void _validate_sparse_compressed_tensor_args_worker(const Tensor& compressed_ind
        /*is_crow = */layout == kSparseCsr || layout == kSparseBsr,
        compressed_indices,
        plain_indices,
-        ncompressed_dims,
-        nplain_dims,
+        compressed_dim_size,
+        plain_dim_size,
        values_nnz
    );
  }
@ -357,23 +357,23 @@ DimVector _estimate_sparse_compressed_tensor_size(
                      (block_ndim == 2 ? std::max<int64_t>(1, values.size(batch_ndim + 2)) : 1)
  };
  DimVector size = DimVector(compressed_indices.sizes().slice(0, batch_ndim));
-  int64_t ncompressed_dims = (compressed_indices.dim() > 0 && compressed_indices.size(-1) > 0 ? compressed_indices.size(-1) - 1 : 0);
-  int64_t nplain_dims = AT_DISPATCH_INTEGRAL_TYPES(plain_indices.scalar_type(), "estimate_sparse_compressed_tensor_size",
-                                                   [&]() -> int64_t {
-                                                     if (plain_indices.numel() > 0) {
-                                                       return plain_indices.max().item<scalar_t>() + 1;
-                                                     } else {
-                                                       return 0;
-                                                     }
-                                                   });
+  int64_t compressed_dim_size = (compressed_indices.dim() > 0 && compressed_indices.size(-1) > 0 ? compressed_indices.size(-1) - 1 : 0);
+  int64_t plain_dim_size = AT_DISPATCH_INTEGRAL_TYPES(plain_indices.scalar_type(), "estimate_sparse_compressed_tensor_size",
+                                                      [&]() -> int64_t {
+                                                        if (plain_indices.numel() > 0) {
+                                                          return plain_indices.max().item<scalar_t>() + 1;
+                                                        } else {
+                                                          return 0;
+                                                        }
+                                                      });
  AT_DISPATCH_ROW_SPARSE_COMPRESSED_LAYOUTS(layout, "estimate_sparse_compressed_tensor_size",
      [&]{
-        size.push_back(ncompressed_dims * blocksize[0]);
-        size.push_back(nplain_dims * blocksize[1]);
+        size.push_back(compressed_dim_size * blocksize[0]);
+        size.push_back(plain_dim_size * blocksize[1]);
      },
      [&]{
-        size.push_back(nplain_dims * blocksize[0]);
-        size.push_back(ncompressed_dims * blocksize[1]);
+        size.push_back(plain_dim_size * blocksize[0]);
+        size.push_back(compressed_dim_size * blocksize[1]);
      });
  for (int i=0; i<dense_ndim; i++) {
    int64_t j = batch_ndim + 1 + base_ndim + i;
--- a/docs/source/sparse.rst
+++ b/docs/source/sparse.rst
@ -23,7 +23,10 @@ as processor resources can be spared if only the non-zero elements are
 stored or/and processed. Various sparse storage formats (`such as COO,
 CSR/CSC, LIL, etc.`__) have been developed that are optimized for a
 particular structure of non-zero elements in sparse arrays as well as
-for specific operations on the arrays.
+for specific operations on the arrays. PyTorch supports the following
+sparse storage formats: :ref:`COO<sparse-coo-docs>`,
+:ref:`CSR<sparse-csr-docs>`, :ref:`CSC<sparse-csc-docs>`,
+:ref:`BSR<sparse-bsr-docs>`, and :ref:`BSC<sparse-bsc-docs>`.

 __ https://en.wikipedia.org/wiki/Sparse_matrix

@ -136,7 +139,7 @@ only:

 .. _sparse-hybrid-coo-docs:

-Hybrid sparse COO tensors
+Sparse hybrid COO tensors
 -------------------------

 Pytorch implements an extension of sparse tensors with scalar values
@ -157,8 +160,8 @@ have:

 .. note::

-   We use (M + K)-dimensional tensor to denote a N-dimensional hybrid
-   sparse tensor, where M and K are the numbers of sparse and dense
+   We use (M + K)-dimensional tensor to denote a N-dimensional sparse
+   hybrid tensor, where M and K are the numbers of sparse and dense
   dimensions, respectively, such that M + K == N holds.

 Suppose we want to create a (2 + 1)-dimensional tensor with the entry
@ -208,7 +211,7 @@ invariants:
 Uncoalesced sparse COO tensors
 ------------------------------

-PyTorch sparse COO tensor format permits *uncoalesced* sparse tensors,
+PyTorch sparse COO tensor format permits sparse *uncoalesced* tensors,
 where there may be duplicate coordinates in the indices; in this case,
 the interpretation is that the value at that index is the sum of all
 duplicate value entries. For example, one can specify multiple values,
@ -242,7 +245,7 @@ sparse tensor with the following properties:

  For the most part, you shouldn't have to care whether or not a
  sparse tensor is coalesced or not, as most operations will work
-  identically given a coalesced or uncoalesced sparse tensor.
+  identically given a sparse coalesced or uncoalesced tensor.

  However, some operations can be implemented more efficiently on
  uncoalesced tensors, and some on coalesced tensors.
@ -340,7 +343,7 @@ When working with uncoalesced sparse COO tensors, one must take into
 an account the additive nature of uncoalesced data: the values of the
 same indices are the terms of a sum that evaluation gives the value of
 the corresponding tensor element. For example, the scalar
-multiplication on an uncoalesced sparse tensor could be implemented by
+multiplication on a sparse uncoalesced tensor could be implemented by
 multiplying all the uncoalesced values with the scalar because ``c *
 (a + b) == c * a + c * b`` holds. However, any nonlinear operation,
 say, a square root, cannot be implemented by applying the operation to
@ -370,49 +373,143 @@ assumption that the fill value is negative infinity.

 .. See https://github.com/Quansight-Labs/rfcs/tree/pearu/rfc-fill-value/RFC-0004-sparse-fill-value for a new API

-.. _sparse-csr-docs:
+.. _sparse-compressed-docs:

-Sparse CSR Tensor
-+++++++++++++++++
+Sparse Compressed Tensors
+++++++++++++++++++++++++

-The CSR (Compressed Sparse Row) sparse tensor format implements the CSR format
-for storage of 2 dimensional tensors. Although there is no support for N-dimensional
-tensors, the primary advantage over the COO format is better use of storage and
-much faster computation operations such as sparse matrix-vector multiplication
-using MKL and MAGMA backends. CUDA support does not exist as of now.
+Sparse Compressed Tensors represent a class of sparse tensors that
+have a common feature of compressing the indices of a certain dimension
+using an encoding that enables certain optimizations on linear algebra
+kernels of sparse compressed tensors. This encoding is based on the
+`Compressed Sparse Row (CSR)`__ format that PyTorch sparse compressed
+tensors extend with the support of sparse tensor batches, allowing
+multi-dimensional tensor values, and storing sparse tensor values in
+dense blocks.

-A CSR sparse tensor consists of three 1-D tensors: ``crow_indices``, ``col_indices``
-and ``values``:
-
-  - The ``crow_indices`` tensor consists of compressed row indices. This is a 1-D tensor
-    of size ``size[0] + 1``. The last element is the number of non-zeros. This tensor
-    encodes the index in ``values`` and ``col_indices`` depending on where the given row
-    starts. Each successive number in the tensor subtracted by the number before it denotes
-    the number of elements in a given row.
-  - The ``col_indices`` tensor contains the column indices of each value. This is a 1-D
-    tensor of size ``nnz``.
-  - The ``values`` tensor  contains the values of the CSR tensor. This is a 1-D tensor
-    of size ``nnz``.
+__ https://en.wikipedia.org/wiki/Sparse_matrix#Compressed_sparse_row_(CSR,_CRS_or_Yale_format)

 .. note::

-   The index tensors ``crow_indices`` and ``col_indices`` should have element type either
-   ``torch.int64`` (default) or ``torch.int32``. If you want to use MKL-enabled matrix
-   operations, use ``torch.int32``. This is as a result of the default linking of pytorch
-   being with MKL LP64, which uses 32 bit integer indexing.
+   We use (B + M + K)-dimensional tensor to denote an N-dimensional
+   sparse compressed hybrid tensor, where B, M, and K are the numbers
+   of batch, sparse, and dense dimensions, respectively, such that
+   ``B + M + K == N`` holds. The number of sparse dimensions for
+   sparse compressed tensors is always two, ``M == 2``.
+
+.. note::
+
+   We say that an indices tensor ``compressed_indices`` uses CSR
+   encoding if the following invariants are satisfied:
+
+   - ``compressed_indices`` is a contiguous strided 32 or 64 bit
+     integer tensor
+   - ``compressed_indices`` shape is ``(*batchsize,
+     compressed_dim_size + 1)`` where ``compressed_dim_size`` is the
+     number of compressed dimensions (e.g. rows or columns)
+   - ``compressed_indices[..., 0] == 0`` where ``...`` denotes batch
+     indices
+   - ``compressed_indices[..., compressed_dim_size] == nse`` where
+     ``nse`` is the number of specified elements
+   - ``0 <= compressed_indices[..., i] - compressed_indices[..., i -
+     1] <= plain_dim_size`` for ``i=1, ..., compressed_dim_size``,
+     where ``plain_dim_size`` is the number of plain dimensions
+     (orthogonal to compressed dimensions, e.g. columns or rows).
+
+.. _sparse-csr-docs:
+
+Sparse CSR Tensor
+-----------------
+
+The primary advantage of the CSR format over the COO format is better
+use of storage and much faster computation operations such as sparse
+matrix-vector multiplication using MKL and MAGMA backends.
+
+In the simplest case, a (0 + 2 + 0)-dimensional sparse CSR tensor
+consists of three 1-D tensors: ``crow_indices``, ``col_indices`` and
+``values``:
+
+  - The ``crow_indices`` tensor consists of compressed row
+    indices. This is a 1-D tensor of size ``nrows + 1`` (the number of
+    rows plus 1). The last element of ``crow_indices`` is the number
+    of specified elements, ``nse``. This tensor encodes the index in
+    ``values`` and ``col_indices`` depending on where the given row
+    starts. Each successive number in the tensor subtracted by the
+    number before it denotes the number of elements in a given row.
+
+  - The ``col_indices`` tensor contains the column indices of each
+    element. This is a 1-D tensor of size ``nse``.
+
+  - The ``values`` tensor contains the values of the CSR tensor
+    elements. This is a 1-D tensor of size ``nse``.
+
+.. note::
+
+   The index tensors ``crow_indices`` and ``col_indices`` should have
+   element type either ``torch.int64`` (default) or
+   ``torch.int32``. If you want to use MKL-enabled matrix operations,
+   use ``torch.int32``. This is as a result of the default linking of
+   pytorch being with MKL LP64, which uses 32 bit integer indexing.
+
+In the general case, the (B + 2 + K)-dimensional sparse CSR tensor
+consists of two (B + 1)-dimensional index tensors ``crow_indices`` and
+``col_indices``, and of (1 + K)-dimensional ``values`` tensor such
+that
+
+  - ``crow_indices.shape == (*batchsize, nrows + 1)``
+
+  - ``col_indices.shape == (*batchsize, nse)``
+
+  - ``values.shape == (nse, *densesize)``
+
+while the shape of the sparse CSR tensor is ``(*batchsize, nrows,
+ncols, *densesize)`` where ``len(batchsize) == B`` and
+``len(densesize) == K``.
+
+.. note::
+
+   The batches of sparse CSR tensors are dependent: the number of
+   specified elements in all batches must be the same. This somewhat
+   artificial constraint allows efficient storage of the indices of
+   different CSR batches.
+
+.. note::
+
+   The number of sparse and dense dimensions can be acquired using
+   :meth:`torch.Tensor.sparse_dim` and :meth:`torch.Tensor.dense_dim`
+   methods. The batch dimensions can be computed from the tensor
+   shape: ``batchsize = tensor.shape[:-tensor.sparse_dim() -
+   tensor.dense_dim()]``.
+
+.. note::
+
+   The memory consumption of a sparse CSR tensor is at least
+   ``(nrows * 8 + (8 + <size of element type in bytes> *
+   prod(densesize)) * nse) * prod(batchsize)`` bytes (plus a constant
+   overhead from storing other tensor data).
+
+   With the same example data of :ref:`the note in sparse COO format
+   introduction<sparse-coo-docs>`, the memory consumption of a 10 000
+   x 10 000 tensor with 100 000 non-zero 32-bit floating point numbers
+   is at least ``(10000 * 8 + (8 + 4 * 1) * 100 000) * 1 = 1 280 000``
+   bytes when using CSR tensor layout. Notice the 1.6 and 310 fold
+   savings from using CSR storage format compared to using the COO and
+   strided formats, respectively.

 Construction of CSR tensors
---------------------------
+'''''''''''''''''''''''''''

-Sparse CSR matrices can be directly constructed by using the :func:`torch.sparse_csr_tensor`
-method. The user must supply the row and column indices and values tensors separately.
-The ``size`` argument is optional and will be deduced from the the ``crow_indices``
-and ``col_indices`` if it is not present.
+Sparse CSR tensors can be directly constructed by using the
+:func:`torch.sparse_csr_tensor` function. The user must supply the row
+and column indices and values tensors separately where the row indices
+must be specified using the CSR compression encoding.  The ``size``
+argument is optional and will be deduced from the ``crow_indices`` and
+``col_indices`` if it is not present.

    >>> crow_indices = torch.tensor([0, 2, 4])
    >>> col_indices = torch.tensor([0, 1, 0, 1])
    >>> values = torch.tensor([1, 2, 3, 4])
-    >>> csr = torch.sparse_csr_tensor(crow_indices, col_indices, values, dtype=torch.double)
+    >>> csr = torch.sparse_csr_tensor(crow_indices, col_indices, values, dtype=torch.float64)
    >>> csr
    tensor(crow_indices=tensor([0, 2, 4]),
          col_indices=tensor([0, 1, 0, 1]),
@ -422,20 +519,29 @@ and ``col_indices`` if it is not present.
    tensor([[1., 2.],
            [3., 4.]], dtype=torch.float64)

-CSR Tensor Operations
---------------------
+.. note::

-The simplest way of constructing a sparse CSR tensor from a strided or sparse COO
-tensor is to use :meth:`tensor.to_sparse_csr`. Any zeros in the (strided) tensor will
-be interpreted as missing values in the sparse tensor:
+   The values of sparse dimensions in deduced ``size`` are computed
+   from the size of ``crow_indices`` and the maximal index value in
+   ``col_indices``. If the number of columns needs to be larger than
+   in the deduced ``size`` then the ``size`` argument must be
+   specified explicitly.

-    >>> a = torch.tensor([[0, 0, 1, 0], [1, 2, 0, 0], [0, 0, 0, 0]], dtype = torch.float64)
+The simplest way of constructing a 2-D sparse CSR tensor from a
+strided or sparse COO tensor is to use
+:meth:`torch.Tensor.to_sparse_csr` method. Any zeros in the (strided)
+tensor will be interpreted as missing values in the sparse tensor:
+
+    >>> a = torch.tensor([[0, 0, 1, 0], [1, 2, 0, 0], [0, 0, 0, 0]], dtype=torch.float64)
    >>> sp = a.to_sparse_csr()
    >>> sp
    tensor(crow_indices=tensor([0, 1, 3, 3]),
          col_indices=tensor([2, 0, 1]),
          values=tensor([1., 1., 2.]), size=(3, 4), nnz=3, dtype=torch.float64)

+CSR Tensor Operations
+'''''''''''''''''''''
+
 The sparse matrix-vector multiplication can be performed with the
 :meth:`tensor.matmul` method. This is currently the only math operation
 supported on CSR tensors.
@ -446,6 +552,272 @@ supported on CSR tensors.
            [1.3180],
            [0.0000]], dtype=torch.float64)

+.. _sparse-csc-docs:
+
+Sparse CSC Tensor
+-----------------
+
+The sparse CSC (Compressed Sparse Column) tensor format implements the
+CSC format for storage of 2 dimensional tensors with an extension to
+supporting batches of sparse CSC tensors and values being
+multi-dimensional tensors.
+
+.. note::
+
+   Sparse CSC tensor is essentially a transpose of the sparse CSR
+   tensor when the transposition is about swapping the sparse
+   dimensions.
+
+Similarly to :ref:`sparse CSR tensors <sparse-csr-docs>`, a sparse CSC
+tensor consists of three tensors: ``ccol_indices``, ``row_indices``
+and ``values``:
+
+  - The ``ccol_indices`` tensor consists of compressed column
+    indices. This is a (B + 1)-D tensor of shape ``(*batchsize, ncols + 1)``.
+    The last element is the number of specified
+    elements, ``nse``. This tensor encodes the index in ``values`` and
+    ``row_indices`` depending on where the given column starts. Each
+    successive number in the tensor subtracted by the number before it
+    denotes the number of elements in a given column.
+
+  - The ``row_indices`` tensor contains the row indices of each
+    element. This is a (B + 1)-D tensor of shape ``(*batchsize, nse)``.
+
+  - The ``values`` tensor contains the values of the CSC tensor
+    elements. This is a (1 + K)-D tensor of shape ``(nse, *densesize)``.
+
+Construction of CSC tensors
+'''''''''''''''''''''''''''
+
+Sparse CSC tensors can be directly constructed by using the
+:func:`torch.sparse_csc_tensor` function. The user must supply the row
+and column indices and values tensors separately where the column indices
+must be specified using the CSR compression encoding.  The ``size``
+argument is optional and will be deduced from the ``row_indices`` and
+``ccol_indices`` tensors if it is not present.
+
+    >>> ccol_indices = torch.tensor([0, 2, 4])
+    >>> row_indices = torch.tensor([0, 1, 0, 1])
+    >>> values = torch.tensor([1, 2, 3, 4])
+    >>> csc = torch.sparse_csc_tensor(ccol_indices, row_indices, values, dtype=torch.float64)
+    >>> csc
+    tensor(ccol_indices=tensor([0, 2, 4]),
+           row_indices=tensor([0, 1, 0, 1]),
+           values=tensor([1., 2., 3., 4.]), size=(2, 2), nnz=4,
+           dtype=torch.float64, layout=torch.sparse_csc)
+    >>> csc.to_dense()
+    tensor([[1., 3.],
+            [2., 4.]], dtype=torch.float64)
+
+.. note::
+
+   The sparse CSC tensor constructor function has the compressed
+   column indices argument before the row indices argument.
+
+The (0 + 2 + 0)-dimensional sparse CSC tensors can be constructed from
+any two-dimensional tensor using :meth:`torch.Tensor.to_sparse_csc`
+method. Any zeros in the (strided) tensor will be interpreted as
+missing values in the sparse tensor:
+
+    >>> a = torch.tensor([[0, 0, 1, 0], [1, 2, 0, 0], [0, 0, 0, 0]], dtype=torch.float64)
+    >>> sp = a.to_sparse_csc()
+    >>> sp
+    tensor(ccol_indices=tensor([0, 1, 2, 3, 3]),
+           row_indices=tensor([1, 1, 0]),
+           values=tensor([1., 2., 1.]), size=(3, 4), nnz=3, dtype=torch.float64,
+           layout=torch.sparse_csc)
+
+.. _sparse-bsr-docs:
+
+Sparse BSR Tensor
+-----------------
+
+The sparse BSR (Block compressed Sparse Row) tensor format implements the
+BSR format for storage of two-dimensional tensors with an extension to
+supporting batches of sparse BSR tensors and values being blocks of
+multi-dimensional tensors.
+
+A sparse BSR tensor consists of three tensors: ``crow_indices``,
+``col_indices`` and ``values``:
+
+  - The ``crow_indices`` tensor consists of compressed row
+    indices. This is a (B + 1)-D tensor of shape ``(*batchsize,
+    nrowblocks + 1)``.  The last element is the number of specified blocks,
+    ``nse``. This tensor encodes the index in ``values`` and
+    ``col_indices`` depending on where the given row block
+    starts. Each successive number in the tensor subtracted by the
+    number before it denotes the number of blocks in a given row.
+
+  - The ``col_indices`` tensor contains the column block indices of each
+    element. This is a (B + 1)-D tensor of shape ``(*batchsize,
+    nse)``.
+
+  - The ``values`` tensor contains the values of the sparse BSR tensor
+    elements collected into two-dimensional blocks. This is a (1 + 2 +
+    K)-D tensor of shape ``(nse, *blocksize, *densesize)`` where
+    ``blocksize`` is the two-dimensional shape of a block.
+
+Construction of BSR tensors
+'''''''''''''''''''''''''''
+
+Sparse BSR tensors can be directly constructed by using the
+:func:`torch.sparse_bsr_tensor` function. The user must supply the row
+and column block indices and values tensors separately where the row block indices
+must be specified using the CSR compression encoding.
+The ``size`` argument is optional and will be deduced from the ``crow_indices`` and
+``col_indices`` tensors if it is not present.
+
+    >>> crow_indices = torch.tensor([0, 2, 4])
+    >>> col_indices = torch.tensor([0, 1, 0, 1])
+    >>> values = torch.tensor([[[0, 1, 2], [6, 7, 8]],
+    ...                        [[3, 4, 5], [9, 10, 11]],
+    ...                        [[12, 13, 14], [18, 19, 20]],
+    ...                        [[15, 16, 17], [21, 22, 23]]])
+    >>> bsr = torch.sparse_bsr_tensor(crow_indices, col_indices, values, dtype=torch.float64)
+    >>> bsr
+    tensor(crow_indices=tensor([0, 2, 4]),
+           col_indices=tensor([0, 1, 0, 1]),
+           values=tensor([[[ 0.,  1.,  2.],
+                           [ 6.,  7.,  8.]],
+                          [[ 3.,  4.,  5.],
+                           [ 9., 10., 11.]],
+                          [[12., 13., 14.],
+                           [18., 19., 20.]],
+                          [[15., 16., 17.],
+                           [21., 22., 23.]]]),
+           size=(4, 6), nnz=4, dtype=torch.float64, layout=torch.sparse_bsr)
+    >>> bsr.to_dense()
+    tensor([[ 0.,  1.,  2.,  3.,  4.,  5.],
+            [ 6.,  7.,  8.,  9., 10., 11.],
+            [12., 13., 14., 15., 16., 17.],
+            [18., 19., 20., 21., 22., 23.]], dtype=torch.float64)
+
+The (0 + 2 + 0)-dimensional sparse BSR tensors can be constructed from
+any two-dimensional tensor using :meth:`torch.Tensor.to_sparse_bsr`
+method that also requires the specification of the values block size:
+
+    >>> dense = torch.tensor([[0, 1, 2, 3, 4, 5],
+    ...                       [6, 7, 8, 9, 10, 11],
+    ...                       [12, 13, 14, 15, 16, 17],
+    ...                       [18, 19, 20, 21, 22, 23]])
+    >>> bsr = dense.to_sparse_bsr(blocksize=(2, 3))
+    >>> bsr
+    tensor(crow_indices=tensor([0, 2, 4]),
+           col_indices=tensor([0, 1, 0, 1]),
+           values=tensor([[[ 0,  1,  2],
+                           [ 6,  7,  8]],
+                          [[ 3,  4,  5],
+                           [ 9, 10, 11]],
+                          [[12, 13, 14],
+                           [18, 19, 20]],
+                          [[15, 16, 17],
+                           [21, 22, 23]]]), size=(4, 6), nnz=4,
+           layout=torch.sparse_bsr)
+
+.. _sparse-bsc-docs:
+
+Sparse BSC Tensor
+-----------------
+
+The sparse BSC (Block compressed Sparse Column) tensor format implements the
+BSC format for storage of two-dimensional tensors with an extension to
+supporting batches of sparse BSC tensors and values being blocks of
+multi-dimensional tensors.
+
+A sparse BSC tensor consists of three tensors: ``ccol_indices``,
+``row_indices`` and ``values``:
+
+  - The ``ccol_indices`` tensor consists of compressed column
+    indices. This is a (B + 1)-D tensor of shape ``(*batchsize,
+    ncolblocks + 1)``.  The last element is the number of specified blocks,
+    ``nse``. This tensor encodes the index in ``values`` and
+    ``row_indices`` depending on where the given column block
+    starts. Each successive number in the tensor subtracted by the
+    number before it denotes the number of blocks in a given column.
+
+  - The ``row_indices`` tensor contains the row block indices of each
+    element. This is a (B + 1)-D tensor of shape ``(*batchsize,
+    nse)``.
+
+  - The ``values`` tensor contains the values of the sparse BSC tensor
+    elements collected into two-dimensional blocks. This is a (1 + 2 +
+    K)-D tensor of shape ``(nse, *blocksize, *densesize)`` where
+    ``blocksize`` is the two-dimensional shape of a block.
+
+Construction of BSC tensors
+'''''''''''''''''''''''''''
+
+Sparse BSC tensors can be directly constructed by using the
+:func:`torch.sparse_bsc_tensor` function. The user must supply the row
+and column block indices and values tensors separately where the column block indices
+must be specified using the CSR compression encoding.
+The ``size`` argument is optional and will be deduced from the ``ccol_indices`` and
+``row_indices`` tensors if it is not present.
+
+    >>> ccol_indices = torch.tensor([0, 2, 4])
+    >>> row_indices = torch.tensor([0, 1, 0, 1])
+    >>> values = torch.tensor([[[0, 1, 2], [6, 7, 8]],
+    ...                        [[3, 4, 5], [9, 10, 11]],
+    ...                        [[12, 13, 14], [18, 19, 20]],
+    ...                        [[15, 16, 17], [21, 22, 23]]])
+    >>> bsc = torch.sparse_bsc_tensor(ccol_indices, row_indices, values, dtype=torch.float64)
+    >>> bsc
+    tensor(ccol_indices=tensor([0, 2, 4]),
+           row_indices=tensor([0, 1, 0, 1]),
+           values=tensor([[[ 0.,  1.,  2.],
+                           [ 6.,  7.,  8.]],
+                          [[ 3.,  4.,  5.],
+                           [ 9., 10., 11.]],
+                          [[12., 13., 14.],
+                           [18., 19., 20.]],
+                          [[15., 16., 17.],
+                           [21., 22., 23.]]]), size=(4, 6), nnz=4,
+           dtype=torch.float64, layout=torch.sparse_bsc)
+
+Tools for working with sparse compressed tensors
+------------------------------------------------
+
+All sparse compressed tensors --- CSR, CSC, BSR, and BSC tensors ---
+are conceptually very similar in that their indices data is split
+into two parts: so-called compressed indices that use the CSR
+encoding, and so-called plain indices that are orthogonal to the
+compressed indices. This allows various tools on these tensors to
+share the same implementations that are parameterized by tensor
+layout.
+
+Construction of sparse compressed tensors
+'''''''''''''''''''''''''''''''''''''''''
+
+Sparse CSR, CSC, BSR, and BSC tensors can be constructed by using
+:func:`torch.sparse_compressed_tensor` function that has the same
+interface as the above discussed constructor functions
+:func:`torch.sparse_csr_tensor`, :func:`torch.sparse_csc_tensor`,
+:func:`torch.sparse_bsr_tensor`, and :func:`torch.sparse_bsc_tensor`,
+respectively, but with an extra required ``layout`` argument. The
+following example illustrates a method of constructing CSR and CSC
+tensors using the same input data by specifying the corresponding
+layout parameter to the :func:`torch.sparse_compressed_tensor`
+function:
+
+    >>> compressed_indices = torch.tensor([0, 2, 4])
+    >>> plain_indices = torch.tensor([0, 1, 0, 1])
+    >>> values = torch.tensor([1, 2, 3, 4])
+    >>> csr = torch.sparse_compressed_tensor(compressed_indices, plain_indices, values, layout=torch.sparse_csr)
+    >>> csr
+    tensor(crow_indices=tensor([0, 2, 4]),
+           col_indices=tensor([0, 1, 0, 1]),
+           values=tensor([1, 2, 3, 4]), size=(2, 2), nnz=4,
+           layout=torch.sparse_csr)
+    >>> csc = torch.sparse_compressed_tensor(compressed_indices, plain_indices, values, layout=torch.sparse_csc)
+    >>> csc
+    tensor(ccol_indices=tensor([0, 2, 4]),
+           row_indices=tensor([0, 1, 0, 1]),
+           values=tensor([1, 2, 3, 4]), size=(2, 2), nnz=4,
+           layout=torch.sparse_csc)
+    >>> (csr.transpose(0, 1).to_dense() == csc.to_dense()).all()
+    tensor(True)
+
+
 Supported Linear Algebra operations
 +++++++++++++++++++++++++++++++++++

@ -496,16 +868,21 @@ Tensor methods and sparse
 The following Tensor methods are related to sparse tensors:

 .. autosummary::
+    :toctree: generated
    :nosignatures:

    Tensor.is_sparse
+    Tensor.is_sparse_csr
    Tensor.dense_dim
    Tensor.sparse_dim
    Tensor.sparse_mask
    Tensor.to_sparse
    Tensor.to_sparse_coo
    Tensor.to_sparse_csr
-    Tensor.indices
+    Tensor.to_sparse_csc
+    Tensor.to_sparse_bsr
+    Tensor.to_sparse_bsc
+    Tensor.to_dense
    Tensor.values

 The following Tensor methods are specific to sparse COO tensors:
@ -518,16 +895,26 @@ The following Tensor methods are specific to sparse COO tensors:
    Tensor.sparse_resize_
    Tensor.sparse_resize_and_clear_
    Tensor.is_coalesced
-    Tensor.to_dense
+    Tensor.indices

-The following methods are specific to :ref:`sparse CSR tensors <sparse-csr-docs>`:
+The following methods are specific to :ref:`sparse CSR tensors <sparse-csr-docs>` and :ref:`sparse BSR tensors <sparse-bsr-docs>`:

 .. autosummary::
+    :toctree: generated
    :nosignatures:

    Tensor.crow_indices
    Tensor.col_indices

+The following methods are specific to :ref:`sparse CSC tensors <sparse-csc-docs>` and :ref:`sparse BSC tensors <sparse-bsc-docs>`:
+
+.. autosummary::
+    :toctree: generated
+    :nosignatures:
+
+    Tensor.row_indices
+    Tensor.ccol_indices
+
 The following Tensor methods support sparse COO tensors:

 :meth:`~torch.Tensor.add`
@ -590,6 +977,10 @@ Torch functions specific to sparse Tensors

    sparse_coo_tensor
    sparse_csr_tensor
+    sparse_csc_tensor
+    sparse_bsr_tensor
+    sparse_bsc_tensor
+    sparse_compressed_tensor
    sparse.sum
    sparse.addmm
    sparse.sampled_addmm
@ -629,3 +1020,35 @@ The following :mod:`torch` functions support sparse tensors:
 :func:`~torch.vstack`
 :func:`~torch.zeros`
 :func:`~torch.zeros_like`
+
+In addition, all zero-preserving unary functions support sparse
+COO/CSR/CSC/BSR/BSC tensor inputs:
+
+:func:`~torch.abs`
+:func:`~torch.asin`
+:func:`~torch.asinh`
+:func:`~torch.atan`
+:func:`~torch.atanh`
+:func:`~torch.ceil`
+:func:`~torch.conj_physical`
+:func:`~torch.floor`
+:func:`~torch.log1p`
+:func:`~torch.neg`
+:func:`~torch.round`
+:func:`~torch.sin`
+:func:`~torch.sinh`
+:func:`~torch.sign`
+:func:`~torch.sgn`
+:func:`~torch.signbit`
+:func:`~torch.tan`
+:func:`~torch.tanh`
+:func:`~torch.trunc`
+:func:`~torch.expm1`
+:func:`~torch.sqrt`
+:func:`~torch.angle`
+:func:`~torch.isinf`
+:func:`~torch.isposinf`
+:func:`~torch.isneginf`
+:func:`~torch.isnan`
+:func:`~torch.erf`
+:func:`~torch.erfinv`
--- a/docs/source/tensors.rst
+++ b/docs/source/tensors.rst
@ -669,7 +669,12 @@ Tensor class reference
    Tensor.arctanh_
    Tensor.tolist
    Tensor.topk
+    Tensor.to_dense
    Tensor.to_sparse
+    Tensor.to_sparse_csr
+    Tensor.to_sparse_csc
+    Tensor.to_sparse_bsr
+    Tensor.to_sparse_bsc
    Tensor.trace
    Tensor.transpose
    Tensor.transpose_
--- a/torch/_tensor_docs.py
+++ b/torch/_tensor_docs.py
@ -5319,10 +5319,7 @@ add_docstr_all(
    r"""
 to_dense() -> Tensor

-Creates a strided copy of :attr:`self`.
-
-.. warning::
-  Throws an error if :attr:`self` is a strided tensor.
+Creates a strided copy of :attr:`self` if :attr:`self` is not a strided tensor, otherwise returns :attr:`self`.

 Example::

@ -5342,6 +5339,7 @@ add_docstr_all(
    "to_sparse",
    r"""
 to_sparse(sparseDims) -> Tensor
+
 Returns a sparse copy of the tensor.  PyTorch supports sparse tensors in
 :ref:`coordinate format <sparse-coo-docs>`.

@ -5371,7 +5369,8 @@ add_docstr_all(
    "to_sparse_csr",
    r"""
 to_sparse_csr() -> Tensor
-Convert a tensor to compressed row storage format. Only works with 2D tensors.
+
+Convert a tensor to compressed row storage format (CSR). Only works with 2D tensors.

 Example::

@ -5383,10 +5382,28 @@ Example::
 """,
 )

+add_docstr_all(
+    "to_sparse_csc",
+    r"""
+to_sparse_csc() -> Tensor
+
+Convert a tensor to compressed column storage (CSC) format. Only works with 2D tensors.
+
+Example::
+
+    >>> dense = torch.randn(5, 5)
+    >>> sparse = dense.to_sparse_csc()
+    >>> sparse._nnz()
+    25
+
+""",
+)
+
 add_docstr_all(
    "to_sparse_bsr",
    r"""
 to_sparse_bsr(blocksize) -> Tensor
+
 Convert a CSR tensor to a block sparse row (BSR) storage format of given blocksize.

 Example::
@ -5400,6 +5417,24 @@ Example::
 """,
 )

+add_docstr_all(
+    "to_sparse_bsc",
+    r"""
+to_sparse_bsc(blocksize) -> Tensor
+
+Convert a CSR tensor to a block sparse column (BSC) storage format of given blocksize.
+
+Example::
+
+    >>> dense = torch.randn(10, 10)
+    >>> sparse = dense.to_sparse_csr()
+    >>> sparse_bsc = sparse.to_sparse_bsc((5, 5))
+    >>> sparse_bsc.row_indices()
+    tensor([0, 1, 0, 1])
+
+""",
+)
+
 add_docstr_all(
    "to_mkldnn",
    r"""
--- a/torch/_torch_docs.py
+++ b/torch/_torch_docs.py
@ -10252,37 +10252,39 @@ Example::

 add_docstr(
    torch.sparse_compressed_tensor,
-    r"""
-sparse_compressed_tensor(compressed_indices, plain_indices, values, size=None,
-                         *, dtype=None, layout=None, device=None, requires_grad=False) -> Tensor
+    r"""sparse_compressed_tensor(compressed_indices, plain_indices, values, size=None, """
+    r"""*, dtype=None, layout=None, device=None, requires_grad=False) -> Tensor

 Constructs a :ref:`sparse tensor in Compressed Sparse format - CSR,
-CSC, BSR, or BSC - <sparse-csr-docs>` with specified values at the
-given :attr:`compressed_indices` and :attr:`plain_indices`. Sparse
+CSC, BSR, or BSC - <sparse-compressed-docs>` with specified values at
+the given :attr:`compressed_indices` and :attr:`plain_indices`. Sparse
 matrix multiplication operations in Compressed Sparse format are
 typically faster than that for sparse tensors in COO format. Make you
 have a look at :ref:`the note on the data type of the indices
-<sparse-csr-docs>`.
+<sparse-compressed-docs>`.

 Args:
-    compressed_indices (array_like): One-dimensional array of size
-        size[cdim] + 1 where cdim is 0 or 1 depending on the layout.
-        The last element is the number of non-zeros. This tensor
-        encodes the index in values and plain_indices depending on
-        where the given compressed dimension (row or column)
-        starts. Each successive number in the tensor subtracted by the
-        number before it denotes the number of elements in a given
-        compressed dimension.
+    compressed_indices (array_like): (B+1)-dimensional array of size
+        ``(*batchsize, compressed_dim_size + 1)``.  The last element of
+        each batch is the number of non-zero elements or blocks. This
+        tensor encodes the index in ``values`` and ``plain_indices``
+        depending on where the given compressed dimension (row or
+        column) starts. Each successive number in the tensor
+        subtracted by the number before it denotes the number of
+        elements or blocks in a given compressed dimension.
    plain_indices (array_like): Plain dimension (column or row)
-        co-ordinates of each element in values. Strictly one
-        dimensional tensor with the same length as values.
+        co-ordinates of each element or block in values. (B+1)-dimensional
+        tensor with the same length as values.
    values (array_list): Initial values for the tensor. Can be a list,
-        tuple, NumPy ``ndarray``, scalar, and other types.  For block
-        sparse formats, the dimensionality of values must be two plus
-        the dimensionality of plain_indices.
+        tuple, NumPy ``ndarray``, scalar, and other types that
+        represent a (1+K)-dimensional or (1+2+K)-dimensional tensor
+        where ``K`` is the number of dense dimensions.
    size (list, tuple, :class:`torch.Size`, optional): Size of the
-        sparse tensor. If not provided, the size will be inferred as
-        the minimum size big enough to hold all non-zero elements.
+        sparse tensor: ``(*batchsize, nrows * blocksize[0], ncols *
+        blocksize[1], *densesize)`` where ``blocksize[0] ==
+        blocksize[1] == 1`` for CSR and CSC formats. If not provided,
+        the size will be inferred as the minimum size big enough to
+        hold all non-zero elements or blocks.

 Keyword args:
    dtype (:class:`torch.dtype`, optional): the desired data type of
@ -10327,20 +10329,24 @@ in CSR format are typically faster than that for sparse tensors in COO format. M
 at :ref:`the note on the data type of the indices <sparse-csr-docs>`.

 Args:
-    crow_indices (array_like): One-dimensional array of size size[0] + 1.
-        The last element is the number of non-zeros. This tensor
-        encodes the index in values and col_indices depending on where
-        the given row starts. Each successive number in the tensor
-        subtracted by the number before it denotes the number of
-        elements in a given row.
+    crow_indices (array_like): (B+1)-dimensional array of size
+        ``(*batchsize, nrows + 1)``.  The last element of each batch
+        is the number of non-zeros. This tensor encodes the index in
+        values and col_indices depending on where the given row
+        starts. Each successive number in the tensor subtracted by the
+        number before it denotes the number of elements in a given
+        row.
    col_indices (array_like): Column co-ordinates of each element in
-        values. Strictly one dimensional tensor with the same length
+        values. (B+1)-dimensional tensor with the same length
        as values.
    values (array_list): Initial values for the tensor. Can be a list,
-        tuple, NumPy ``ndarray``, scalar, and other types.
+        tuple, NumPy ``ndarray``, scalar, and other types that
+        represent a (1+K)-dimensional tensor where ``K`` is the number
+        of dense dimensions.
    size (list, tuple, :class:`torch.Size`, optional): Size of the
-        sparse tensor. If not provided, the size will be inferred as
-        the minimum size big enough to hold all non-zero elements.
+        sparse tensor: ``(*batchsize, nrows, ncols, *densesize)``. If
+        not provided, the size will be inferred as the minimum size
+        big enough to hold all non-zero elements.

 Keyword args:
    dtype (:class:`torch.dtype`, optional): the desired data type of
@ -10376,27 +10382,31 @@ add_docstr(
 sparse_csc_tensor(ccol_indices, row_indices, values, size=None, *, dtype=None, device=None, requires_grad=False) -> Tensor

 Constructs a :ref:`sparse tensor in CSC (Compressed Sparse Column)
-<sparse-csr-docs>` with specified values at the given
+<sparse-csc-docs>` with specified values at the given
 :attr:`ccol_indices` and :attr:`row_indices`. Sparse matrix
 multiplication operations in CSC format are typically faster than that
 for sparse tensors in COO format. Make you have a look at :ref:`the
-note on the data type of the indices <sparse-csr-docs>`.
+note on the data type of the indices <sparse-csc-docs>`.

 Args:
-    ccol_indices (array_like): One-dimensional array of size size[1] + 1.
-        The last element is the number of non-zeros. This tensor
-        encodes the index in values and row_indices depending on where
-        the given column starts. Each successive number in the tensor
-        subtracted by the number before it denotes the number of
-        elements in a given column.
+    ccol_indices (array_like): (B+1)-dimensional array of size
+        ``(*batchsize, ncols + 1)``.  The last element of each batch
+        is the number of non-zeros. This tensor encodes the index in
+        values and row_indices depending on where the given column
+        starts. Each successive number in the tensor subtracted by the
+        number before it denotes the number of elements in a given
+        column.
    row_indices (array_like): Row co-ordinates of each element in
-        values. Strictly one dimensional tensor with the same length
-        as values.
+        values. (B+1)-dimensional tensor with the same length as
+        values.
    values (array_list): Initial values for the tensor. Can be a list,
-        tuple, NumPy ``ndarray``, scalar, and other types.
+        tuple, NumPy ``ndarray``, scalar, and other types that
+        represent a (1+K)-dimensional tensor where ``K`` is the number
+        of dense dimensions.
    size (list, tuple, :class:`torch.Size`, optional): Size of the
-        sparse tensor. If not provided, the size will be inferred as
-        the minimum size big enough to hold all non-zero elements.
+        sparse tensor: ``(*batchsize, nrows, ncols, *densesize)``. If
+        not provided, the size will be inferred as the minimum size
+        big enough to hold all non-zero elements.

 Keyword args:
    dtype (:class:`torch.dtype`, optional): the desired data type of
@ -10432,29 +10442,33 @@ add_docstr(
 sparse_bsr_tensor(crow_indices, col_indices, values, size=None, *, dtype=None, device=None, requires_grad=False) -> Tensor

 Constructs a :ref:`sparse tensor in BSR (Block Compressed Sparse Row))
-<sparse-csr-docs>` with specified 2-dimensional blocks at the given
+<sparse-bsr-docs>` with specified 2-dimensional blocks at the given
 :attr:`crow_indices` and :attr:`col_indices`. Sparse matrix
 multiplication operations in BSR format are typically faster than that
 for sparse tensors in COO format. Make you have a look at :ref:`the
-note on the data type of the indices <sparse-csr-docs>`.
+note on the data type of the indices <sparse-bsr-docs>`.

 Args:
-    crow_indices (array_like): One-dimensional array of size size[0] +
-        1. The last element is the number of non-zeros. This tensor
-        encodes the index in values and col_indices depending on where
-        the given row starts. Each successive number in the tensor
+    crow_indices (array_like): (B+1)-dimensional array of size
+        ``(*batchsize, nrowblocks + 1)``.  The last element of each
+        batch is the number of non-zeros. This tensor encodes the
+        block index in values and col_indices depending on where the
+        given row block starts. Each successive number in the tensor
        subtracted by the number before it denotes the number of
        blocks in a given row.
-    col_indices (array_like): Column co-ordinates of each block in
-        values. Strictly one dimensional tensor with the same length
-        as values.
+    col_indices (array_like): Column block co-ordinates of each block
+        in values. (B+1)-dimensional tensor with the same length as
+        values.
    values (array_list): Initial values for the tensor. Can be a list,
-        tuple, NumPy ``ndarray``, scalar, and other types. The
-        dimensionality of values must be two plus the dimensionality
-        of col_indices.
+        tuple, NumPy ``ndarray``, scalar, and other types that
+        represent a (1 + 2 + K)-dimensional tensor where ``K`` is the
+        number of dense dimensions.
    size (list, tuple, :class:`torch.Size`, optional): Size of the
-        sparse tensor. If not provided, the size will be inferred as
-        the minimum size big enough to hold all non-zero blocks.
+        sparse tensor: ``(*batchsize, nrows * blocksize[0], ncols *
+        blocksize[1], *densesize)`` where ``blocksize ==
+        values.shape[1:3]``. If not provided, the size will be
+        inferred as the minimum size big enough to hold all non-zero
+        blocks.

 Keyword args:
    dtype (:class:`torch.dtype`, optional): the desired data type of
@ -10479,7 +10493,6 @@ Example::
           col_indices=tensor([0, 1]),
           values=tensor([[[1., 2.],
                           [3., 4.]],
-
                          [[5., 6.],
                           [7., 8.]]]), size=(2, 2), nnz=2, dtype=torch.float64,
           layout=torch.sparse_bsr)
@ -10494,28 +10507,32 @@ add_docstr(
 sparse_bsc_tensor(ccol_indices, row_indices, values, size=None, *, dtype=None, device=None, requires_grad=False) -> Tensor

 Constructs a :ref:`sparse tensor in BSC (Block Compressed Sparse
-Column)) <sparse-csr-docs>` with specified 2-dimensional blocks at the
+Column) <sparse-bsc-docs>` with specified 2-dimensional blocks at the
 given :attr:`ccol_indices` and :attr:`row_indices`. Sparse matrix
 multiplication operations in BSC format are typically faster than that
 for sparse tensors in COO format. Make you have a look at :ref:`the
-note on the data type of the indices <sparse-csr-docs>`.
+note on the data type of the indices <sparse-bsc-docs>`.

 Args:
-    ccol_indices (array_like): One-dimensional array of size size[1] +
-        1. The last element is the number of non-zeros. This tensor
-        encodes the index in values and row_indices depending on where
-        the given column starts. Each successive number in the tensor
-        subtracted by the number before it denotes the number of
-        elements in a given column.
-    row_indices (array_like): Row co-ordinates of each element in
-        values. Strictly one dimensional tensor with the same length
+    ccol_indices (array_like): (B+1)-dimensional array of size
+        ``(*batchsize, ncolblocks + 1)``. The last element of each
+        batch is the number of non-zeros. This tensor encodes the
+        block index in values and row_indices depending on where the
+        given column block starts. Each successive number in the
+        tensor subtracted by the number before it denotes the number
+        of blocks in a given column.
+    row_indices (array_like): Row block co-ordinates of each block in
+        values. (B+1)-dimensional tensor with the same length
        as values.
    values (array_list): Initial blocks for the tensor. Can be a list,
-        tuple, NumPy ``ndarray``, and other types. The dimensionality
-        of values must be two plus the dimensionality of row_indices.
+        tuple, NumPy ``ndarray``, and other types that
+        represent a (1 + 2 + K)-dimensional tensor where ``K`` is the
+        number of dense dimensions.
    size (list, tuple, :class:`torch.Size`, optional): Size of the
-        sparse tensor. If not provided, the size will be inferred as
-        the minimum size big enough to hold all non-zero blocks.
+        sparse tensor: ``(*batchsize, nrows * blocksize[0], ncols *
+        blocksize[1], *densesize)``. If not provided, the size will be
+        inferred as the minimum size big enough to hold all non-zero
+        blocks.

 Keyword args:
    dtype (:class:`torch.dtype`, optional): the desired data type of
@ -10540,7 +10557,6 @@ Example::
           row_indices=tensor([0, 1]),
           values=tensor([[[1., 2.],
                           [3., 4.]],
-
                          [[5., 6.],
                           [7., 8.]]]), size=(2, 2), nnz=2, dtype=torch.float64,
           layout=torch.sparse_bsc)