Upload MyLLaMa
Browse files
- llama.py +2 -2
- model.safetensors +2 -2
llama.py
CHANGED
@@ -92,7 +92,7 @@ class RMSNorm(nn.Module):
|
|
92 |
super().__init__()
|
93 |
|
94 |
self.dim = dim
|
95 |
-
self.
|
96 |
data=torch.nn.init.normal_(torch.zeros((dim,))), requires_grad=True
|
97 |
)
|
98 |
self.eps = eps
|
@@ -111,7 +111,7 @@ class RMSNorm(nn.Module):
|
|
111 |
return (
|
112 |
x
|
113 |
/ torch.sqrt_(torch.mean(torch.square(x), dim=-1) + self.eps)[:, :, None]
|
114 |
-
* self.
|
115 |
)
|
116 |
|
117 |
def extra_repr(self) -> str:
|
|
|
92 |
super().__init__()
|
93 |
|
94 |
self.dim = dim
|
95 |
+
self.trainable = nn.Parameter(
|
96 |
data=torch.nn.init.normal_(torch.zeros((dim,))), requires_grad=True
|
97 |
)
|
98 |
self.eps = eps
|
|
|
111 |
return (
|
112 |
x
|
113 |
/ torch.sqrt_(torch.mean(torch.square(x), dim=-1) + self.eps)[:, :, None]
|
114 |
+
* self.trainable
|
115 |
)
|
116 |
|
117 |
def extra_repr(self) -> str:
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daef12499060e6075aece26c79ed43c39d7a1f9ebade23e92004922b5eba2a87
|
3 |
+
size 3161813808
|