import os

# Handle Spaces GPU: on Hugging Face ZeroGPU Spaces the real `spaces`
# package provides the GPU decorator; elsewhere, fall back to a no-op
# stub so the same code also runs locally.
if os.environ.get("SPACES_ZERO_GPU") is not None:
    import spaces
else:
    class spaces:
        @staticmethod
        def GPU(func):
            def wrapper(*args, **kwargs):
                return func(*args, **kwargs)
            return wrapper
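# With the stub in place, `@spaces.GPU` can be applied unconditionally:
# on ZeroGPU hardware the real decorator allocates a GPU for the call,
# while locally the wrapper simply forwards to the undecorated function.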
import pandas as pd
import torch
import gradio as gr
from transformers import AutoModelForCausalLM, AutoTokenizer
from huggingface_hub import login
# Authenticate with the Hugging Face Hub (skipped if no token is set)
HF_TOKEN = os.getenv("HF_TOKEN")
if HF_TOKEN:
    login(token=HF_TOKEN)
# Available models
AVAILABLE_MODELS = {
    "BLOOMZ-560M": "bigscience/bloomz-560m"
}

# Model and tokenizer state, cached globally so a model is only reloaded
# when the user selects a different one
current_model = None
current_tokenizer = None
current_model_name = None
device = "cuda" if torch.cuda.is_available() else "cpu"
def cargar_modelo(nombre_modelo):
    """Load the selected model and tokenizer."""
    global current_model, current_tokenizer, current_model_name
    if current_model_name != nombre_modelo:
        current_model = AutoModelForCausalLM.from_pretrained(AVAILABLE_MODELS[nombre_modelo]).to(device)
        current_tokenizer = AutoTokenizer.from_pretrained(AVAILABLE_MODELS[nombre_modelo])
        current_model_name = nombre_modelo

# Load the default model
cargar_modelo("BLOOMZ-560M")
@spaces.GPU  # requests a GPU on ZeroGPU Spaces; a no-op elsewhere
def obtener_predicciones(texto, nombre_modelo, top_k=10):
    """Return the top-k next-token predictions and their probabilities."""
    global current_model, current_tokenizer
    # Reload the model if the selection changed
    if current_model_name != nombre_modelo:
        cargar_modelo(nombre_modelo)
    entradas = current_tokenizer(texto, return_tensors="pt").to(device)
    with torch.no_grad():
        salidas = current_model(**entradas)
    # Logits at the last position -> probability distribution over the vocabulary
    logits = salidas.logits[0, -1, :]
    probabilidades = torch.nn.functional.softmax(logits, dim=-1)
    top_k_prob, top_k_indices = torch.topk(probabilidades, k=top_k)
    top_k_tokens = [current_tokenizer.decode([idx.item()]) for idx in top_k_indices]
    return top_k_tokens, top_k_prob.cpu().tolist()
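# Example (hypothetical local test, outside the Gradio UI):
#   tokens, probs = obtener_predicciones("Mi abuela me dejó una gran", "BLOOMZ-560M", top_k=5)
#   print(list(zip(tokens, probs)))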
def generar_barplot(tokens, probabilidades):
    """Pack the predictions into a DataFrame, as expected by gr.BarPlot."""
    return pd.DataFrame({"Palabra": tokens, "Probabilidad": probabilidades})
def predecir_siguiente_palabra(nombre_modelo, texto, top_k, token_custom=""):
    """Run the prediction and update the UI."""
    if token_custom:
        texto += token_custom
    tokens, probabilidades = obtener_predicciones(texto, nombre_modelo, int(top_k))
    # Build the data for the Gradio BarPlot
    barplot_data = generar_barplot(tokens, probabilidades)
    return gr.update(choices=[f"'{t}'" for t in tokens]), barplot_data
def agregar_token_seleccionado(texto, token_seleccionado):
    """Append the selected token to the input text."""
    if token_seleccionado:
        token_limpio = token_seleccionado.strip("'")
        texto += f" {token_limpio}"
    return texto
# Build the interface (the UI text itself is in Spanish)
with gr.Blocks() as demo:
    gr.Markdown("# 🔥 Predicción de Texto con Modelos Transformadores")
    gr.Markdown(
        "Esta aplicación permite generar palabras utilizando un modelo de lenguaje. "
        "Selecciona un modelo, introduce un texto y explora las palabras más probables a continuación."
    )
    with gr.Row():
        dropdown_modelo = gr.Dropdown(
            choices=list(AVAILABLE_MODELS.keys()),
            value="BLOOMZ-560M",
            label="📌 Modelo de lenguaje"
        )
        dropdown_top_k = gr.Dropdown(
            choices=["5", "10", "15", "20"],
            value="10",
            label="🔢 Número de palabras a mostrar"
        )
    with gr.Row():
        texto_entrada = gr.Textbox(
            lines=5,
            label="📝 Texto de entrada",
            placeholder="Escribe aquí...",
            value="Mi abuela me dejó una gran"
        )
    with gr.Row():
        boton_predecir = gr.Button("🔮 Predecir")
    with gr.Row():
        dropdown_tokens = gr.Dropdown(
            label="🔠 Palabras predichas",
            choices=[]
        )
        boton_agregar = gr.Button("➕ Agregar palabra")
    with gr.Row():
        barplot_resultados = gr.BarPlot(
            value=pd.DataFrame(columns=["Palabra", "Probabilidad"]),  # empty DataFrame so the plot renders before the first prediction
            x="Palabra",
            y="Probabilidad",
            title="📊 Predicciones del modelo"
        )
    # Button actions
    boton_predecir.click(
        predecir_siguiente_palabra,
        inputs=[dropdown_modelo, texto_entrada, dropdown_top_k],
        outputs=[dropdown_tokens, barplot_resultados]
    )
    boton_agregar.click(
        agregar_token_seleccionado,
        inputs=[texto_entrada, dropdown_tokens],
        outputs=texto_entrada
    )

demo.queue().launch()
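# To run locally (assumes `gradio`, `torch`, `transformers`, `pandas` and
# `huggingface_hub` are installed): python app.py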