import gradio as gr

# Load the interface for the referenced model, keeping a handle to it in
# `demo` instead of chaining the calls on one line.
demo = gr.load("models/HF1BitLLM/Llama3-8B-1.58-100B-tokens")

# Start serving the loaded interface; no launch options are overridden.
demo.launch()