Spaces:
Runtime error
Runtime error
Commit
·
a2d6b9a
1
Parent(s):
a21c8ab
Update app.py
Browse files
app.py
CHANGED
@@ -108,8 +108,8 @@ mqa_total_time = 0.
|
|
108 |
mha_total_time = 0.
|
109 |
|
110 |
for i in range(n_start, n):
|
111 |
-
shared_time = out_exec(bs, h, i, d)[2] + softmax_exec(bs, h, i , d)[2] \
|
112 |
-
|
113 |
mha_time = shared_time + qkv_mha_exec(bs, h, i, d)[2] + att1_mha_exec(bs, h, i, d)[2] + att2_mha_exec(bs, h, i, d)[2]
|
114 |
mha_total_time += l*mha_time
|
115 |
mqa_time = shared_time + qkv_mqa_exec(bs, h, i, d)[2] + att1_mqa_exec(bs, h, i, d)[2] + att2_mqa_exec(bs, h, i, d)[2]
|
|
|
108 |
mha_total_time = 0.
|
109 |
|
110 |
for i in range(n_start, n):
|
111 |
+
shared_time = out_exec(bs, h, i, d)[2] + softmax_exec(bs, h, i , d)[2] + 2*ln_exec(bs, h, i, d)[2] \
|
112 |
+
+ 2*mlp_exec(bs, h, i, d)[2] + 3*ln_exec(bs, h, i, d)
|
113 |
mha_time = shared_time + qkv_mha_exec(bs, h, i, d)[2] + att1_mha_exec(bs, h, i, d)[2] + att2_mha_exec(bs, h, i, d)[2]
|
114 |
mha_total_time += l*mha_time
|
115 |
mqa_time = shared_time + qkv_mqa_exec(bs, h, i, d)[2] + att1_mqa_exec(bs, h, i, d)[2] + att2_mqa_exec(bs, h, i, d)[2]
|