diff --git a/python/mlx/nn/layers/normalization.py b/python/mlx/nn/layers/normalization.py index d5e1a1c6e..9c77667e7 100644 --- a/python/mlx/nn/layers/normalization.py +++ b/python/mlx/nn/layers/normalization.py @@ -198,7 +198,7 @@ class BatchNorm(Module): batch, ``C`` is the number of features or channels, and ``L`` is the sequence length. The output has the same shape as the input. For four-dimensional arrays, the shape is ``NHWC``, where ``H`` and ``W`` are - the height and width respecitvely. + the height and width respectively. For more information on Batch Normalization, see the original paper `Batch Normalization: Accelerating Deep Network Training by Reducing Internal