harmdevries committed on
Commit
81ea362
·
1 Parent(s): ebde2f8

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -3
app.py CHANGED
@@ -149,7 +149,7 @@ c1.write("Cached keys and values (GB)")
149
  acts = round(2*bs*l*(d/h)*h*2*n/1e9, 2)
150
  c2.write(str(acts))
151
 
152
- st.subheader("Multi-Query Attention")
153
  c1, c2 = st.columns([2, 4])
154
  num_params = (10+2/h)*l*d*d
155
  c1.write("Num Parameters (in B)")
@@ -160,8 +160,12 @@ c1.write("Cached keys and values (GB)")
160
  acts = round(2*bs*l*(d/h)*2*n/1e9, 2)
161
  c2.write(str(acts))
162
 
163
- st.subheader("How we approximate the inference time")
164
- st.write("TODO")
 
 
 
 
165
 
166
  breakdown = st.checkbox("Show breakdown per operation")
167
  if breakdown:
 
149
  acts = round(2*bs*l*(d/h)*h*2*n/1e9, 2)
150
  c2.write(str(acts))
151
 
152
+ st.caption("Multi-Query Attention")
153
  c1, c2 = st.columns([2, 4])
154
  num_params = (10+2/h)*l*d*d
155
  c1.write("Num Parameters (in B)")
 
160
  acts = round(2*bs*l*(d/h)*2*n/1e9, 2)
161
  c2.write(str(acts))
162
 
163
+ st.subheader("Approximations")
164
+ st.markdown("We estimate the time for each matrix multiplication")
165
+
166
+ st.latex(r"C = A \cdot B, A \in \mathbb{R}^{N \times M}")
167
+
168
+
169
 
170
  breakdown = st.checkbox("Show breakdown per operation")
171
  if breakdown: