Spaces: Runtime error
Commit · ebde2f8
1 Parent(s): 4bb67b3
Update app.py
Browse files
app.py
CHANGED
@@ -137,8 +137,8 @@ c2.write(str(round(mqa_total_time, 2)))
|
|
137 |
c1.write("Speed-up MQA over MHA: ")
|
138 |
c2.write(str(round(mha_total_time/mqa_total_time,2)))
|
139 |
|
140 |
-
st.
|
141 |
-
st.
|
142 |
c1, c2 = st.columns([2, 4])
|
143 |
num_params = 12*l*d*d
|
144 |
c1.write("Num Parameters (in B)")
|
@@ -149,7 +149,7 @@ c1.write("Cached keys and values (GB)")
|
|
149 |
acts = round(2*bs*l*(d/h)*h*2*n/1e9, 2)
|
150 |
c2.write(str(acts))
|
151 |
|
152 |
-
st.subheader("
|
153 |
c1, c2 = st.columns([2, 4])
|
154 |
num_params = (10+2/h)*l*d*d
|
155 |
c1.write("Num Parameters (in B)")
|
|
|
137 |
c1.write("Speed-up MQA over MHA: ")
|
138 |
c2.write(str(round(mha_total_time/mqa_total_time,2)))
|
139 |
|
140 |
+
st.subheader("Memory consumption")
|
141 |
+
st.caption("Multi-Head Attention")
|
142 |
c1, c2 = st.columns([2, 4])
|
143 |
num_params = 12*l*d*d
|
144 |
c1.write("Num Parameters (in B)")
|
|
|
149 |
acts = round(2*bs*l*(d/h)*h*2*n/1e9, 2)
|
150 |
c2.write(str(acts))
|
151 |
|
152 |
+
st.subheader("Multi-Query Attention")
|
153 |
c1, c2 = st.columns([2, 4])
|
154 |
num_params = (10+2/h)*l*d*d
|
155 |
c1.write("Num Parameters (in B)")
|