Spaces: Runtime error
Commit
·
a2d6b9a
1
Parent(s):
a21c8ab
Update app.py
Browse files
app.py
CHANGED
|
@@ -108,8 +108,8 @@ mqa_total_time = 0.
|
|
| 108 |
mha_total_time = 0.
|
| 109 |
|
| 110 |
for i in range(n_start, n):
|
| 111 |
-
shared_time = out_exec(bs, h, i, d)[2] + softmax_exec(bs, h, i , d)[2] \
|
| 112 |
-
|
| 113 |
mha_time = shared_time + qkv_mha_exec(bs, h, i, d)[2] + att1_mha_exec(bs, h, i, d)[2] + att2_mha_exec(bs, h, i, d)[2]
|
| 114 |
mha_total_time += l*mha_time
|
| 115 |
mqa_time = shared_time + qkv_mqa_exec(bs, h, i, d)[2] + att1_mqa_exec(bs, h, i, d)[2] + att2_mqa_exec(bs, h, i, d)[2]
|
|
|
|
| 108 |
mha_total_time = 0.
|
| 109 |
|
| 110 |
for i in range(n_start, n):
|
| 111 |
+
shared_time = out_exec(bs, h, i, d)[2] + softmax_exec(bs, h, i , d)[2] + 2*ln_exec(bs, h, i, d)[2] \
|
| 112 |
+
+ 2*mlp_exec(bs, h, i, d)[2] + 3*ln_exec(bs, h, i, d)
|
| 113 |
mha_time = shared_time + qkv_mha_exec(bs, h, i, d)[2] + att1_mha_exec(bs, h, i, d)[2] + att2_mha_exec(bs, h, i, d)[2]
|
| 114 |
mha_total_time += l*mha_time
|
| 115 |
mqa_time = shared_time + qkv_mqa_exec(bs, h, i, d)[2] + att1_mqa_exec(bs, h, i, d)[2] + att2_mqa_exec(bs, h, i, d)[2]
|