harmdevries committed on
Commit
ebde2f8
·
1 Parent(s): 4bb67b3

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -137,8 +137,8 @@ c2.write(str(round(mqa_total_time, 2)))
137
  c1.write("Speed-up MQA over MHA: ")
138
  c2.write(str(round(mha_total_time/mqa_total_time,2)))
139
 
140
- st.header("Memory consumption")
141
- st.subheader("MHA")
142
  c1, c2 = st.columns([2, 4])
143
  num_params = 12*l*d*d
144
  c1.write("Num Parameters (in B)")
@@ -149,7 +149,7 @@ c1.write("Cached keys and values (GB)")
149
  acts = round(2*bs*l*(d/h)*h*2*n/1e9, 2)
150
  c2.write(str(acts))
151
 
152
- st.subheader("MQA")
153
  c1, c2 = st.columns([2, 4])
154
  num_params = (10+2/h)*l*d*d
155
  c1.write("Num Parameters (in B)")
 
137
  c1.write("Speed-up MQA over MHA: ")
138
  c2.write(str(round(mha_total_time/mqa_total_time,2)))
139
 
140
+ st.subheader("Memory consumption")
141
+ st.caption("Multi-Head Attention")
142
  c1, c2 = st.columns([2, 4])
143
  num_params = 12*l*d*d
144
  c1.write("Num Parameters (in B)")
 
149
  acts = round(2*bs*l*(d/h)*h*2*n/1e9, 2)
150
  c2.write(str(acts))
151
 
152
+ st.subheader("Multi-Query Attention")
153
  c1, c2 = st.columns([2, 4])
154
  num_params = (10+2/h)*l*d*d
155
  c1.write("Num Parameters (in B)")