KaleiNeely
committed on
Commit
•
dfc9ae3
1
Parent(s):
29770da
Update modeling_rwkv6.py
Browse files
- modeling_rwkv6.py +1 -1
modeling_rwkv6.py
CHANGED
@@ -132,7 +132,7 @@ class Rwkv6SelfAttention(nn.Module):
|
|
132 |
|
133 |
TIME_DECAY_EXTRA_DIM = 64
|
134 |
if hidden_size == 4096: #7b
|
135 |
-
|
136 |
self.time_decay_w1 = nn.Parameter(torch.empty(hidden_size, TIME_DECAY_EXTRA_DIM))
|
137 |
self.time_decay_w2 = nn.Parameter(torch.empty(TIME_DECAY_EXTRA_DIM, attention_hidden_size))
|
138 |
|
|
|
132 |
|
133 |
TIME_DECAY_EXTRA_DIM = 64
|
134 |
if hidden_size == 4096: #7b
|
135 |
+
TIME_DECAY_EXTRA_DIM = 128
|
136 |
self.time_decay_w1 = nn.Parameter(torch.empty(hidden_size, TIME_DECAY_EXTRA_DIM))
|
137 |
self.time_decay_w2 = nn.Parameter(torch.empty(TIME_DECAY_EXTRA_DIM, attention_hidden_size))
|
138 |
|