Vokturz committed
Commit 74c26d6 · 1 Parent(s): 204281c

fix typo

Files changed: src/app.py (+2 −2)
src/app.py CHANGED

@@ -87,7 +87,7 @@ lora_pct = st.sidebar.slider("LoRa % trainable parameters", 0.1, 100.0, 2.0, ste
 st.sidebar.dataframe(gpu_spec.T)
 
 memory_table = pd.DataFrame(st.session_state[model_name][1]).set_index('dtype')
-memory_table['LoRA Fine-…
+memory_table['LoRA Fine-Tuning (GB)'] = (memory_table["Total Size (GB)"] +
                                         (memory_table["Parameters (Billion)"]* lora_pct/100 * (16/8)*4)) * 1.2
 
 _, col, _ = st.columns([1,3,1])
@@ -99,7 +99,7 @@ with col.expander("Information", expanded=True):
     where is estimated as """)
 
     st.latex(r"""\text{Memory}_\text{Inference} \approx \text{Model Size} \times 1.2""")
-    st.markdown("""- For LoRa Fine-…
+    st.markdown("""- For LoRa Fine-tuning, I'm asuming a **16-bit** dtype of trainable parameters. The formula (in terms of GB) is""")
     st.latex(r"\text{Memory}_\text{LoRa} \approx \text{Model Size} + \left(\text{ \# trainable Params}_\text{Billions}\times\frac{16}{8} \times 4\right) \times 1.2")
     st.markdown("- You can understand `int4` as models in `GPTQ-4bit`, `AWQ-4bit` or `Q4_0 GGUF/GGML` formats")
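For reference, a minimal, self-contained sketch of the two estimates the changed lines implement; it is not part of the commit, and the function names and the 7B-model numbers are made up for illustration. Note it follows the code path, which applies the 1.2 overhead factor to the whole sum, whereas the rendered LaTeX attaches the 1.2 only to the adapter term.

```python
# Standalone sketch of the app's memory estimates (illustrative, not the
# app's own API). Arguments mirror the app's variables: model size in GB,
# parameter count in billions, and the LoRa % trainable-parameters slider.

def inference_memory_gb(model_size_gb: float) -> float:
    # Memory_Inference ≈ Model Size × 1.2 (the 1.2 adds ~20% overhead)
    return model_size_gb * 1.2

def lora_memory_gb(model_size_gb: float, params_billion: float,
                   lora_pct: float) -> float:
    # Memory_LoRa ≈ (Model Size + #trainable params (B) × 16/8 × 4) × 1.2,
    # as computed in the diff: 16/8 = bytes per 16-bit trainable parameter,
    # and ×4 accounts for gradients and optimizer states.
    trainable_billion = params_billion * lora_pct / 100
    return (model_size_gb + trainable_billion * (16 / 8) * 4) * 1.2

# Example: a 7B model stored in float16 (~14 GB) with 2% trainable params
print(f"{inference_memory_gb(14.0):.1f} GB")       # ≈ 16.8 GB
print(f"{lora_memory_gb(14.0, 7.0, 2.0):.1f} GB")  # ≈ 18.1 GB
```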