Spaces:

C2MV
/

BioRAG

Sleeping

App Files Files Community

BioRAG / model_app.py

C2MV

Upload 3 files

de3a711 verified about 1 month ago

raw

history blame

7.75 kB

	# modal_app.py
	import modal
	import sys
	from pathlib import Path
	import os
	import traceback

	# --- Configuration ---
	# Python version requested for the Debian-slim base image built below.
	PYTHON_VERSION = "3.10"
	# Name given to the Modal stub; also used as a prefix for the HF cache volume name.
	APP_NAME = "bioprocess-custom-eq-agent-modal"
	# Directory containing this file; requirements.txt is read from here and the
	# whole directory is mounted into the image.
	LOCAL_APP_DIR = Path(__file__).parent
	# Location inside the container where LOCAL_APP_DIR is mounted (also exported as PYTHONPATH).
	REMOTE_APP_DIR = "/app"

	# Modal stub on which the remote function, ASGI app and local entrypoint are registered.
	# NOTE(review): newer Modal releases expose this as `modal.App` -- confirm against the pinned modal version.
	stub = modal.Stub(APP_NAME)

	# Container image used by both the LLM function and the Gradio ASGI endpoint.
	app_image = (
	modal.Image.debian_slim(python_version=PYTHON_VERSION)
	# Install the Python dependencies listed in the requirements.txt next to this file.
	.pip_install_from_requirements(LOCAL_APP_DIR / "requirements.txt")
	# Bring the local application directory into the image at REMOTE_APP_DIR.
	.copy_mount(
	modal.Mount.from_local_dir(LOCAL_APP_DIR, remote_path=REMOTE_APP_DIR)
	)
	# Environment: make the app directory importable and point the Hugging Face
	# and matplotlib caches at the directories created by run_commands below.
	.env({
	"PYTHONPATH": REMOTE_APP_DIR,
	"HF_HOME": "/cache/huggingface",
	"HF_HUB_CACHE": "/cache/huggingface/hub",
	"TRANSFORMERS_CACHE": "/cache/huggingface/hub",
	"MPLCONFIGDIR": "/tmp/matplotlib_cache"
	})
	# Install git and git-lfs (cleaning the apt lists afterwards) and create the cache directories.
	.run_commands(
	"apt-get update && apt-get install -y git git-lfs && rm -rf /var/lib/apt/lists/*",
	"mkdir -p /cache/huggingface/hub /tmp/matplotlib_cache"
	)
	)

	# --- Modal function for the LLM ---
	@stub.function(
	    image=app_image,
	    gpu="any",
	    secrets=[modal.Secret.from_name("huggingface-read-token", optional=True)],
	    timeout=600,  # 10 minutes
	    volumes={"/cache/huggingface": modal.Volume.persisted(f"{APP_NAME}-hf-cache-vol")},
	)
	def generate_analysis_llm_modal_remote(prompt: str, model_path_config: str, max_new_tokens_config: int) -> str:
	    """Generate a text analysis for ``prompt`` with a Hugging Face causal LM.

	    The tokenizer and model are loaded from ``model_path_config`` on every
	    call, the prompt is truncated to fit the model's context window, and a
	    sampled completion of at most ``max_new_tokens_config`` tokens is decoded.

	    Args:
	        prompt: Text fed to the model.
	        model_path_config: Model identifier/path passed to ``from_pretrained``.
	        max_new_tokens_config: Upper bound on the number of generated tokens.

	    Returns:
	        The generated text with surrounding whitespace stripped. If anything
	        raises, the exception is printed with its traceback and an error
	        message string is returned instead of propagating the exception.
	    """
	    # Heavy imports stay inside the function so they only run in the Modal container.
	    import torch
	    from transformers import AutoTokenizer, AutoModelForCausalLM

	    hf_token = os.environ.get("HUGGING_FACE_TOKEN")
	    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
	    print(f"LLM Modal Func: Usando dispositivo: {device}")
	    print(f"LLM Modal Func: Cargando modelo: {model_path_config} con token: {'Sí' if hf_token else 'No'}")

	    try:
	        # Arguments shared by the tokenizer and the model loader.
	        # trust_remote_code is needed by some models such as Qwen (original author's note).
	        hub_kwargs = {
	            "cache_dir": "/cache/huggingface/hub",
	            "token": hf_token,
	            "trust_remote_code": True,
	        }
	        tokenizer = AutoTokenizer.from_pretrained(model_path_config, **hub_kwargs)
	        model = AutoModelForCausalLM.from_pretrained(
	            model_path_config,
	            torch_dtype="auto",
	            device_map="auto",
	            **hub_kwargs,
	        )

	        # Context window: max_position_embeddings, else sliding_window, else 4096.
	        model_cfg = model.config
	        window_fallback = getattr(model_cfg, "sliding_window", 4096)
	        context_window = getattr(model_cfg, "max_position_embeddings", window_fallback)
	        if context_window is None:
	            context_window = 4096

	        # Reserve room for the generated tokens plus a 50-token buffer; if that
	        # leaves nothing for the prompt, give the prompt half of the window.
	        prompt_budget = context_window - max_new_tokens_config - 50
	        if prompt_budget <= 0:
	            prompt_budget = context_window // 2

	        encoded = tokenizer(
	            prompt,
	            return_tensors="pt",
	            truncation=True,
	            max_length=prompt_budget,
	        )
	        encoded = encoded.to(model.device)

	        # Fall back to the EOS token when the tokenizer defines no pad token.
	        pad_id = tokenizer.pad_token_id
	        if pad_id is None:
	            pad_id = tokenizer.eos_token_id

	        with torch.no_grad():
	            generated = model.generate(
	                **encoded,
	                max_new_tokens=max_new_tokens_config,
	                eos_token_id=tokenizer.eos_token_id,
	                pad_token_id=pad_id,
	                do_sample=True,
	                temperature=0.6,
	                top_p=0.9,
	            )

	        # Drop the prompt tokens so only the newly generated part is decoded.
	        prompt_token_count = encoded.input_ids.shape[1]
	        completion_ids = generated[0][prompt_token_count:]
	        analysis = tokenizer.decode(completion_ids, skip_special_tokens=True)

	        print(f"LLM Modal Func: Longitud del análisis generado: {len(analysis)} caracteres.")
	        return analysis.strip()
	    except Exception as e:
	        tb_text = traceback.format_exc()
	        print(f"Error en generate_analysis_llm_modal_remote: {e}\n{tb_text}")
	        return f"Error al generar análisis con el modelo LLM: {str(e)}"

	# --- Gradio server ---
	@stub.asgi_app(image=app_image)  # Use the same image for the ASGI endpoint
	def serve_gradio_app_asgi():
	    """Build the Gradio interface and return it as an ASGI application.

	    Steps, in order:
	      1. Ensure ``REMOTE_APP_DIR`` is on ``sys.path``.
	      2. Replace ``decorators.GPU`` / ``decorators.gpu_decorator`` (when the
	         module and attributes exist) with no-op decorators, before the
	         application modules are imported.
	      3. Import the application modules and inject a wrapper into the
	         ``interface`` module that forwards prompts to
	         ``generate_analysis_llm_modal_remote``.
	      4. Create the Gradio UI and wrap it with ``gr.routes.App.create_app``.

	    Returns:
	        The ASGI app produced by ``gr.routes.App.create_app``.
	    """
	    import gradio as gr

	    # The image already sets PYTHONPATH to REMOTE_APP_DIR; this explicit check
	    # is a harmless safety net.
	    if REMOTE_APP_DIR not in sys.path:
	        sys.path.insert(0, REMOTE_APP_DIR)
	        print(f"INFO (modal_app.py): Añadido {REMOTE_APP_DIR} a sys.path")

	    # --- Neutralize the problematic decorator BEFORE importing the app modules ---
	    # Intended to avoid the "No @spaces.GPU function detected" error.
	    try:
	        import decorators  # The project's own decorators.py

	        class _GPUNeutralizerModal:
	            """No-op stand-in for ``decorators.GPU``.

	            Accepts any constructor arguments (``GPU()``, ``GPU(60)``,
	            ``GPU(duration=60)``) and returns the decorated function
	            unchanged. Bare usage (``@GPU``) also returns the function itself.
	            """

	            def __new__(cls, *args, **kwargs):
	                # Bare decorator usage: the only argument is the function
	                # being decorated, so hand it straight back.
	                if len(args) == 1 and not kwargs and callable(args[0]):
	                    return args[0]
	                return super().__new__(cls)

	            def __init__(self, *args, **kwargs):
	                # Arguments are accepted and ignored. The previous signature
	                # (self, args, *kwargs) rejected keyword arguments and
	                # zero-argument calls with a TypeError.
	                pass

	            def __call__(self, func):
	                return func

	        if hasattr(decorators, 'GPU'):
	            decorators.GPU = _GPUNeutralizerModal
	            print("INFO (modal_app.py): 'decorators.GPU' neutralizado para el entorno Modal.")
	        if hasattr(decorators, 'gpu_decorator'):
	            decorators.gpu_decorator = lambda duration=0: lambda func: func
	            print("INFO (modal_app.py): 'decorators.gpu_decorator' neutralizado para el entorno Modal.")
	    except ImportError:
	        print("ADVERTENCIA (modal_app.py): Módulo 'decorators' no encontrado durante la neutralización. Esto puede ser OK.")
	    except Exception as e_neut:
	        # Best effort: a failure here must not prevent the app from starting.
	        print(f"ADVERTENCIA (modal_app.py): Error durante la neutralización de decoradores: {e_neut}")
	    # --- End of neutralization ---

	    # Import the application modules only now, after the patching above.
	    from UI import create_interface
	    import interface as app_interface_module
	    from config import MODEL_PATH as cfg_MODEL_PATH, MAX_LENGTH as cfg_MAX_LENGTH

	    def analysis_func_wrapper_for_interface_modal(prompt: str) -> str:
	        """Forward ``prompt`` to the remote Modal LLM function using the configured model settings."""
	        print("Gradio Backend (Modal): Llamando a generate_analysis_llm_modal_remote.remote...")
	        return generate_analysis_llm_modal_remote.remote(prompt, cfg_MODEL_PATH, cfg_MAX_LENGTH)

	    # Inject the wrapper into the `interface` module used by Gradio.
	    app_interface_module.generate_analysis_from_modal = analysis_func_wrapper_for_interface_modal
	    app_interface_module.USE_MODAL_FOR_LLM_ANALYSIS = True
	    print("INFO (modal_app.py): Runner de LLM Modal inyectado en el módulo 'interface'.")

	    # Create the Gradio app, passing it the real processing function.
	    gradio_ui_instance = create_interface(process_function_for_button=app_interface_module.process_and_plot)

	    print("INFO (modal_app.py): Interfaz Gradio creada y lista para ser servida.")
	    return gr.routes.App.create_app(gradio_ui_instance)

	@stub.local_entrypoint()
	def test_llm_local_entry():  # Renamed to avoid clashing with an earlier `test_llm`
	    """Send one sample prompt to the remote LLM function and print the reply.

	    Run with ``modal run modal_app.py test_llm_local_entry`` (per the original
	    author's note). Any exception raised by the remote call is printed with
	    its traceback rather than propagated.
	    """
	    print("Probando la generación de LLM con Modal (local_entrypoint)...")
	    # Make the local app directory importable so `config` resolves when run
	    # locally. The guard checks the same path that is inserted; it previously
	    # checked REMOTE_APP_DIR, which is unrelated to the local directory.
	    local_app_dir = str(LOCAL_APP_DIR)
	    if local_app_dir not in sys.path:
	        sys.path.insert(0, local_app_dir)
	    from config import MODEL_PATH, MAX_LENGTH

	    sample_prompt = "Explica brevemente el concepto de R cuadrado (R²) en el ajuste de modelos."
	    try:
	        # The stub must be active for the remote call to work.
	        analysis = generate_analysis_llm_modal_remote.remote(sample_prompt, MODEL_PATH, MAX_LENGTH)
	        print("\nRespuesta del LLM:")
	        print(analysis)
	    except Exception as e:
	        print(f"Error durante test_llm_local_entry: {e}")
	        traceback.print_exc()