Spaces:
Running
on
Zero
Running
on
Zero
import torch | |
from torch import nn | |
class RMSNorm(nn.Module): | |
""" | |
Initialize the RMSNorm normalization layer. | |
Args: | |
dim (int): The dimension of the input tensor. | |
eps (float, optional): A small value added to the denominator for numerical stability. Default is 1e-6. | |
Attributes: | |
eps (float): A small value added to the denominator for numerical stability. | |
weight (nn.Parameter): Learnable scaling parameter. | |
""" | |
def __init__(self, dim: int, eps: float = 1e-6): | |
super().__init__() | |
self.eps = eps | |
self.weight = nn.Parameter(torch.ones(dim)) | |
def _norm(self, x: torch.Tensor): | |
return x * torch.rsqrt(x.pow(2).mean(-1, keepdim=True) + self.eps) | |
def forward(self, x: torch.Tensor): | |
output = self._norm(x.float()).type_as(x) | |
return output * self.weight | |
def reset_parameters(self): | |
torch.nn.init.ones_(self.weight) # type: ignore |