Spaces:

yabramuvdi
/

llms-demo

Running

App Files Files Community

llms-demo / app.py

yabramuvdi

Update app.py

899bbf4 verified 5 months ago

raw

history blame contribute delete

5.36 kB

	import os
	# Handle Spaces GPU: import the real `spaces` package when the
	# SPACES_ZERO_GPU environment variable is set; otherwise define a no-op
	# stand-in so `spaces.GPU` decorators still work.
	# NOTE(review): a later unconditional `import spaces` in this file rebinds
	# the name (or raises ImportError if the package is absent), bypassing this
	# fallback -- confirm whether that import is intended.
	if os.environ.get("SPACES_ZERO_GPU") is not None:
	    import spaces
	else:
	    import functools

	    class spaces:
	        """Minimal stand-in exposing a pass-through ``GPU`` decorator."""

	        @staticmethod
	        def GPU(func=None, **_options):
	            """Wrap a function in a transparent pass-through.

	            Works in the bare form (``@spaces.GPU``) and in the called form
	            (``@spaces.GPU()`` / ``@spaces.GPU(duration=...)``). Keyword
	            options are accepted and ignored.
	            """

	            def decorate(target):
	                @functools.wraps(target)
	                def wrapper(*args, **kwargs):
	                    return target(*args, **kwargs)

	                return wrapper

	            # Bare usage hands us the function directly; called usage hands
	            # us nothing (or only options) and expects a decorator back.
	            if callable(func):
	                return decorate(func)
	            return decorate

	@spaces.GPU
	def fake_gpu():
	    """Do nothing; a placeholder function decorated with ``spaces.GPU``."""
	    return None

	import numpy as np
	import pandas as pd
	import torch
	import gradio as gr
	import matplotlib.pyplot as plt
	from transformers import AutoModelForCausalLM, AutoTokenizer
	import spaces
	from huggingface_hub import login

	# Authenticate with the Hugging Face Hub using the HF_TOKEN environment
	# variable. Skip the call when no token is configured: `login(token=None)`
	# falls back to an interactive prompt, which cannot be answered in a
	# headless deployment.
	HF_TOKEN = os.getenv('HF_TOKEN')
	if HF_TOKEN:
	    login(token=HF_TOKEN)

	# Available models: display name -> identifier handed to `from_pretrained`.
	AVAILABLE_MODELS = {
	    "BLOOMZ-560M": "bigscience/bloomz-560m",
	}

	# Model/tokenizer state; all unset until a model is loaded.
	current_model = current_tokenizer = current_model_name = None

	# Use CUDA when torch reports it as available, otherwise the CPU.
	if torch.cuda.is_available():
	    device = "cuda"
	else:
	    device = "cpu"

	def cargar_modelo(nombre_modelo):
	    """Load the selected model and tokenizer into the module-level slots.

	    Does nothing when ``nombre_modelo`` is already the active model.
	    Otherwise the name is looked up in ``AVAILABLE_MODELS`` (an unknown name
	    raises ``KeyError``), the model is loaded and moved to ``device``, the
	    matching tokenizer is loaded, and the active name is recorded.
	    """
	    global current_model, current_tokenizer, current_model_name

	    if current_model_name == nombre_modelo:
	        return

	    repo_id = AVAILABLE_MODELS[nombre_modelo]
	    modelo = AutoModelForCausalLM.from_pretrained(repo_id)
	    current_model = modelo.to(device)
	    current_tokenizer = AutoTokenizer.from_pretrained(repo_id)
	    current_model_name = nombre_modelo

	# Load the default model when the module is imported
	cargar_modelo("BLOOMZ-560M")

	@spaces.GPU()
	def obtener_predicciones(texto, nombre_modelo, top_k=10):
	    """Return the most likely next tokens for ``texto`` with their probabilities.

	    Args:
	        texto: Prompt text; surrounding whitespace is stripped before
	            tokenizing.
	        nombre_modelo: Key of ``AVAILABLE_MODELS`` naming the model to use; it
	            is loaded first if it is not the active one.
	        top_k: Maximum number of candidates to return.

	    Returns:
	        A ``(tokens, probabilities)`` pair of equal-length lists as produced
	        by ``torch.topk``. Both lists are empty when the prompt produces no
	        tokens.
	    """
	    # Load the model if the selection changed.
	    if current_model_name != nombre_modelo:
	        cargar_modelo(nombre_modelo)

	    entradas = current_tokenizer(texto.strip(), return_tensors="pt")

	    # A prompt that tokenizes to nothing has no last position to read logits
	    # from; report "no predictions" instead of failing inside the model.
	    if entradas["input_ids"].numel() == 0:
	        return [], []

	    entradas = entradas.to(device)

	    with torch.no_grad():
	        salidas = current_model(**entradas)
	        # Logits at the last input position of the first (only) batch item.
	        logits = salidas.logits[0, -1, :]
	        probabilidades = torch.nn.functional.softmax(logits, dim=-1)

	    # Never ask torch.topk for more entries than the distribution holds.
	    k = min(int(top_k), probabilidades.shape[-1])
	    top_k_prob, top_k_indices = torch.topk(probabilidades, k=k)

	    # Decode each id on its own and strip surrounding whitespace.
	    top_k_tokens = [
	        current_tokenizer.decode([token_id]).strip()
	        for token_id in top_k_indices.tolist()
	    ]

	    return top_k_tokens, top_k_prob.cpu().tolist()

	def generar_barplot(tokens, probabilidades):
	    """Build the bar-plot data as a DataFrame sorted by descending probability.

	    The result has the columns ``"Palabra"`` (from ``tokens``) and
	    ``"Probabilidad"`` (from ``probabilidades``); rows keep their original
	    index labels after sorting.
	    """
	    columnas = {"Palabra": tokens, "Probabilidad": probabilidades}
	    return pd.DataFrame(columnas).sort_values(by="Probabilidad", ascending=False)

	def predecir_siguiente_palabra(nombre_modelo, texto, top_k, token_custom=""):
	    """Compute next-token predictions and build the UI updates for them.

	    Args:
	        nombre_modelo: Model display name forwarded to ``obtener_predicciones``.
	        texto: Current prompt text.
	        top_k: Number of candidates to request; converted with ``int`` because
	            the UI dropdown supplies it as a string.
	        token_custom: Optional extra token appended to ``texto`` (separated by
	            a single space) before predicting.

	    Returns:
	        A pair: a dropdown update holding the single-quoted candidate tokens,
	        and the DataFrame from ``generar_barplot`` for the bar plot.
	    """
	    if token_custom:
	        texto = texto.rstrip() + " " + token_custom.strip()

	    tokens, probabilidades = obtener_predicciones(texto, nombre_modelo, int(top_k))
	    barplot_data = generar_barplot(tokens, probabilidades)

	    # Replace the choices and clear the current selection: a value left over
	    # from the previous prediction may not be among the new choices.
	    opciones = [f"'{t}'" for t in tokens]
	    return gr.update(choices=opciones, value=None), barplot_data

	def agregar_token_seleccionado(texto, token_seleccionado):
	    """Append the selected token to the input text without extra spaces.

	    Args:
	        texto: Current input text.
	        token_seleccionado: Dropdown value, normally a token wrapped in one
	            pair of single quotes (e.g. ``"'word'"``); may be empty or None.

	    Returns:
	        ``texto`` with trailing whitespace removed, followed by a single space
	        and the token. ``texto`` is returned unchanged when there is no token
	        to add, and the token alone is returned when ``texto`` is blank.
	    """
	    if not token_seleccionado:
	        return texto

	    token = token_seleccionado
	    # Remove exactly one wrapping pair of quotes so apostrophes that belong
	    # to the token itself (e.g. "'s") are preserved.
	    if len(token) >= 2 and token[0] == "'" and token[-1] == "'":
	        token = token[1:-1]
	    token = token.strip()
	    if not token:
	        return texto

	    base = texto.rstrip()
	    if not base:
	        # Nothing typed yet: avoid starting the text with a space.
	        return token
	    return base + " " + token

	# Build the interface (all user-facing labels are in Spanish)
	with gr.Blocks() as demo:
	gr.Markdown("# 🔥 Predicción de Texto con Modelos Transformadores")
	gr.Markdown(
	"Esta aplicación permite generar palabras utilizando un modelo de lenguaje. "
	"Selecciona un modelo, introduce un texto y explora las palabras más probables a continuación."
	)

	# Row 1: model selector and number of predictions to show
	with gr.Row():
	dropdown_modelo = gr.Dropdown(
	choices=list(AVAILABLE_MODELS.keys()),
	value="BLOOMZ-560M",
	label="📌 Modelo de lenguaje"
	)

	# Choices are strings; the click handler converts the selection with int()
	dropdown_top_k = gr.Dropdown(
	choices=["5", "10", "15", "20"],
	value="10",
	label="🔢 Número de palabras a mostrar"
	)

	# Row 2: prompt text
	with gr.Row():
	texto_entrada = gr.Textbox(
	lines=5,
	label="📝 Texto de entrada",
	placeholder="Escribe aquí...",
	value=""
	)

	# Row 3: trigger a prediction
	with gr.Row():
	boton_predecir = gr.Button("🔮 Predecir")

	# Row 4: predicted tokens (filled in after a prediction) and the add button
	with gr.Row():
	dropdown_tokens = gr.Dropdown(
	label="🔠 Palabras predichas",
	choices=[]
	)
	boton_agregar = gr.Button("➕ Agregar palabra")

	# Row 5: bar plot of the predicted probabilities
	with gr.Row():
	barplot_resultados = gr.BarPlot(
	value=pd.DataFrame(columns=["Palabra", "Probabilidad"]), # ✅ Empty DataFrame to initialize
	x="Probabilidad", # ✅ Swap axes to make it horizontal
	y="Palabra",
	title="📊 Predicciones del modelo",
	orientation="h" # ✅ Makes the barplot horizontal
	)

	# Button actions
	# Predict: (model, text, top_k) -> updated token dropdown and bar plot data
	boton_predecir.click(
	predecir_siguiente_palabra,
	inputs=[dropdown_modelo, texto_entrada, dropdown_top_k],
	outputs=[dropdown_tokens, barplot_resultados]
	)

	# Add: append the selected token to the prompt text box
	boton_agregar.click(
	agregar_token_seleccionado,
	inputs=[texto_entrada, dropdown_tokens],
	outputs=texto_entrada
	)

	# Enable request queuing and start the app
	demo.queue().launch()