[nit] fix xavier init doc (#157100)

Remove a part of the documentation that is irrelevant and confusing at best, and probably a copy-paste mistake:

<img src="https://github.com/user-attachments/assets/77fa5734-5a5a-4f8d-80a5-bc3269668e07" width="500">
Pull Request resolved: https://github.com/pytorch/pytorch/pull/157100
Approved by: https://github.com/mikaylagawarecki
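For context, the deleted note concerned how ``fan_in`` and ``fan_out`` relate to the stored weight shape. Below is a minimal sketch of the documented usage on a ``Linear`` weight; the layer sizes and the ReLU gain are illustrative, not taken from the diff:

```python
import torch
import torch.nn as nn

# nn.Linear stores its weight as [out_features, in_features],
# i.e. w.shape = [fan_out, fan_in], and the forward pass uses x @ w.T.
linear = nn.Linear(in_features=5, out_features=3)

# For a 2-D tensor, fan_in is taken from dim 1 and fan_out from dim 0,
# so the stored weight can be initialized directly -- no transpose needed.
nn.init.xavier_uniform_(linear.weight, gain=nn.init.calculate_gain("relu"))
print(linear.weight.shape)  # torch.Size([3, 5])
```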
Author: Lucas Beyer
Date: 2025-06-27 19:13:35 +00:00
Committed by: PyTorch MergeBot
Parent: 75a7d9e868
Commit: 8a88c6e85a


@@ -459,14 +459,6 @@ def xavier_uniform_(
     Examples:
         >>> w = torch.empty(3, 5)
         >>> nn.init.xavier_uniform_(w, gain=nn.init.calculate_gain("relu"))
-
-    Note:
-        Be aware that ``fan_in`` and ``fan_out`` are calculated assuming
-        that the weight matrix is used in a transposed manner,
-        (i.e., ``x @ w.T`` in ``Linear`` layers, where ``w.shape = [fan_out, fan_in]``).
-        This is important for correct initialization.
-        If you plan to use ``x @ w``, where ``w.shape = [fan_in, fan_out]``,
-        pass in a transposed weight matrix, i.e. ``nn.init.xavier_uniform_(w.T, ...)``.
     """
     fan_in, fan_out = _calculate_fan_in_and_fan_out(tensor)
     std = gain * math.sqrt(2.0 / float(fan_in + fan_out))
@@ -499,14 +491,6 @@ def xavier_normal_(
     Examples:
         >>> w = torch.empty(3, 5)
         >>> nn.init.xavier_normal_(w)
-
-    Note:
-        Be aware that ``fan_in`` and ``fan_out`` are calculated assuming
-        that the weight matrix is used in a transposed manner,
-        (i.e., ``x @ w.T`` in ``Linear`` layers, where ``w.shape = [fan_out, fan_in]``).
-        This is important for correct initialization.
-        If you plan to use ``x @ w``, where ``w.shape = [fan_in, fan_out]``,
-        pass in a transposed weight matrix, i.e. ``nn.init.xavier_normal_(w.T, ...)``.
     """
     fan_in, fan_out = _calculate_fan_in_and_fan_out(tensor)
     std = gain * math.sqrt(2.0 / float(fan_in + fan_out))
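
For reference, both hunks keep the same statistic, ``std = gain * sqrt(2 / (fan_in + fan_out))``. A small sketch checking it against the two initializers; the 3x5 shape mirrors the docstring examples and the tolerance is illustrative:

```python
import math
import torch
import torch.nn as nn

w = torch.empty(3, 5)          # fan_out = 3, fan_in = 5 for a 2-D tensor
fan_in, fan_out, gain = 5, 3, 1.0
std = gain * math.sqrt(2.0 / float(fan_in + fan_out))

# xavier_normal_ draws from N(0, std^2).
nn.init.xavier_normal_(w)

# xavier_uniform_ draws from U(-a, a) with a = sqrt(3) * std,
# which has the same variance; all samples stay within that bound.
nn.init.xavier_uniform_(w)
bound = math.sqrt(3.0) * std
assert w.abs().max().item() <= bound + 1e-6
```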