Spaces:

LLM360
/

k2-eval-gallery

Running

k2-eval-gallery / app.py

Suqi Sun

Upload results for 3 metrics

c173eef about 1 year ago

1.93 kB

	import os
	import streamlit as st
	import json
	import tarfile

	# Locate the bundled evaluation results relative to this script, so the app
	# does not depend on the process's current working directory.
	PARENT_PATH: str = os.path.dirname(os.path.abspath(__file__))
	EVAL_DIR: str = os.path.join(PARENT_PATH, "eval-results")

	# Page setup: wide layout, then the title and a short introduction.
	st.set_page_config(layout="wide")
	st.title("K2 Evaluation Gallery")
	st.markdown(
	    """The K2 gallery allows one to browse the output of various evaluations on intermediate K2 checkpoints, which provides an intuitive understanding on how the model develops and improves over time."""
	)

	# Sidebar: project logos plus the two selectors (metric, n-shot setting) that
	# pick which sub-directory of EVAL_DIR the main panel browses.
	with st.sidebar:
	    # Hub files are served raw from `/resolve/<revision>/`; the `/blob/<revision>/`
	    # URL returns the HTML file viewer, which an <img> tag cannot display.
	    html = (
	        "<img src='https://www.llm360.ai/images/logo-highres.png' width='100' />"
	        "<img src='https://huggingface.co/spaces/LLM360/k2-gallery/resolve/main/k2-logo.svg' width='100' />"
	    )
	    st.markdown(html, unsafe_allow_html=True)

	    # os.listdir returns entries in arbitrary order; sort so the option order
	    # (and therefore the default selection) is stable across runs and hosts.
	    metric = st.radio("Choose a metric", options=sorted(os.listdir(EVAL_DIR)))

	    n_shot = st.radio(
	        "Select an n-shot number",
	        options=sorted(os.listdir(os.path.join(EVAL_DIR, metric))),
	    )

	def _load_first_json(archive_path: str) -> object:
	    """Parse the first regular file inside a gzip-compressed tar archive as JSON.

	    Directory and other non-file members are skipped, because
	    ``TarFile.extractfile`` returns ``None`` for them.

	    Raises:
	        ValueError: the archive holds no regular file, or its content is not
	            valid JSON (``json.JSONDecodeError`` is a ``ValueError``).
	        tarfile.TarError: the file is not a readable ``.tar.gz`` archive.
	    """
	    with tarfile.open(archive_path, "r:gz") as archive:
	        for member in archive:
	            if member.isfile():
	                with archive.extractfile(member) as payload:
	                    return json.load(payload)
	    raise ValueError(f"no regular file found in {os.path.basename(archive_path)}")


	def _render_checkpoint_column(column, title: str, key_prefix: str) -> None:
	    """Render one checkpoint browser (checkpoint picker, file picker, JSON view).

	    ``key_prefix`` keeps the widget keys of the two columns distinct
	    (``<prefix>1`` for the checkpoint selectbox, ``<prefix>2`` for the file one).
	    """
	    with column:
	        st.header(title)

	        ckpt_root = os.path.join(EVAL_DIR, metric, n_shot)
	        ckpt = st.selectbox(
	            "Select a checkpoint", sorted(os.listdir(ckpt_root)), key=f"{key_prefix}1"
	        )
	        if ckpt is None:
	            # An empty option list makes the selectbox return None.
	            st.info("No checkpoints available for this selection.")
	            return
	        st.write(f"Viewing Evaluation Results for Checkpoint: `{ckpt}`")

	        ckpt_dir = os.path.join(ckpt_root, ckpt)
	        file = st.selectbox(
	            "Select a file", sorted(os.listdir(ckpt_dir)), key=f"{key_prefix}2"
	        )
	        if file is None:
	            st.info("No result files available for this checkpoint.")
	            return

	        try:
	            results = _load_first_json(os.path.join(ckpt_dir, file))
	        except (tarfile.TarError, ValueError) as err:
	            # Report an unreadable archive in place instead of aborting the page.
	            st.error(f"Could not read `{file}`: {err}")
	            return
	        st.json(results)


	# Two independent browsers side by side, so two checkpoints can be compared.
	col1, col2 = st.columns(2)
	_render_checkpoint_column(col1, "Checkpoint A", "A")
	_render_checkpoint_column(col2, "Checkpoint B", "B")