harmdevries committed on
Commit
8f8d70a
·
1 Parent(s): 3ddfba1

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -4
app.py CHANGED
@@ -86,8 +86,6 @@ def print_kernel_execution(c1, c2, comp_flop, mem_bytes):
86
 
87
  return exec_time
88
 
89
-
90
-
91
  st.sidebar.header("Transformer parameters")
92
  col1, col2 = st.sidebar.columns([2, 4])
93
 
@@ -115,7 +113,7 @@ for i in range(n_start, n):
115
  mqa_time = shared_time + qkv_mqa_exec(bs, h, i, d)[2] + att1_mqa_exec(bs, h, i, d)[2] + att2_mqa_exec(bs, h, i, d)[2]
116
  mqa_total_time += l*mqa_time
117
 
118
- c1, c2 = st.columns(2, 4)
119
  c1.write("Multi-Head Attention:")
120
  c2.write(str(round(mha_total_time, 2)))
121
  c1.write("Multi-Query Attention:")
@@ -125,7 +123,7 @@ c2.write(str(round(mha_total_time/mqa_total_time),2))
125
 
126
  st.header("Memory consumption")
127
  st.caption("MHA")
128
- c1, c2 = st.columns(2, 4)
129
  num_params = 12*l*d*d
130
  c1.write("Num Parameters (in B)")
131
  c2.write(str(round(num_params/1e9, 3)))
 
86
 
87
  return exec_time
88
 
 
 
89
  st.sidebar.header("Transformer parameters")
90
  col1, col2 = st.sidebar.columns([2, 4])
91
 
 
113
  mqa_time = shared_time + qkv_mqa_exec(bs, h, i, d)[2] + att1_mqa_exec(bs, h, i, d)[2] + att2_mqa_exec(bs, h, i, d)[2]
114
  mqa_total_time += l*mqa_time
115
 
116
+ c1, c2 = st.columns([2, 4])
117
  c1.write("Multi-Head Attention:")
118
  c2.write(str(round(mha_total_time, 2)))
119
  c1.write("Multi-Query Attention:")
 
123
 
124
  st.header("Memory consumption")
125
  st.caption("MHA")
126
+ c1, c2 = st.columns([2, 4])
127
  num_params = 12*l*d*d
128
  c1.write("Num Parameters (in B)")
129
  c2.write(str(round(num_params/1e9, 3)))