Spaces:

Ntdeseb
/

ntia

Running

App Files Files Community

ntia / app.py

Ntdeseb

Arreglando acceso a modelos - FLUX requiere permisos, usando modelos libres por defecto

36c2ab8 about 2 months ago

raw

history blame

15 kB

	import gradio as gr
	import torch
	from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
	from diffusers import StableDiffusionPipeline, DiffusionPipeline
	import requests
	from PIL import Image
	import io
	import base64

	# Configuración de modelos libres
	MODELS = {
	"text": {
	"microsoft/DialoGPT-medium": "Chat conversacional",
	"microsoft/DialoGPT-large": "Chat conversacional avanzado",
	"microsoft/DialoGPT-small": "Chat conversacional rápido",
	"gpt2": "Generación de texto",
	"gpt2-medium": "GPT-2 mediano",
	"gpt2-large": "GPT-2 grande",
	"distilgpt2": "GPT-2 optimizado",
	"EleutherAI/gpt-neo-125M": "GPT-Neo pequeño",
	"EleutherAI/gpt-neo-1.3B": "GPT-Neo mediano",
	"microsoft/DialoGPT-medium": "Chat conversacional",
	"facebook/opt-125m": "OPT pequeño",
	"facebook/opt-350m": "OPT mediano",
	"bigscience/bloom-560m": "BLOOM multilingüe",
	"bigscience/bloom-1b1": "BLOOM grande",
	"microsoft/DialoGPT-medium": "Chat conversacional",
	"Helsinki-NLP/opus-mt-es-en": "Traductor español-inglés",
	"Helsinki-NLP/opus-mt-en-es": "Traductor inglés-español"
	},
	"image": {
	"CompVis/stable-diffusion-v1-4": "Stable Diffusion v1.4 (Libre)",
	"stabilityai/stable-diffusion-2-1": "Stable Diffusion 2.1",
	"stabilityai/stable-diffusion-xl-base-1.0": "SDXL Base",
	"stabilityai/stable-diffusion-3-medium": "SD 3 Medium",
	"prompthero/openjourney": "Midjourney Style",
	"WarriorMama777/OrangeMixs": "Orange Mixs",
	"hakurei/waifu-diffusion": "Waifu Diffusion",
	"black-forest-labs/FLUX.1-schnell": "FLUX.1 Schnell (Requiere acceso)",
	"black-forest-labs/FLUX.1-dev": "FLUX.1 Dev (Requiere acceso)"
	},
	"chat": {
	"microsoft/DialoGPT-medium": "Chat conversacional",
	"microsoft/DialoGPT-large": "Chat conversacional avanzado",
	"microsoft/DialoGPT-small": "Chat conversacional rápido",
	"facebook/opt-350m": "OPT conversacional",
	"bigscience/bloom-560m": "BLOOM multilingüe"
	}
	}

	# Cache para los modelos
	model_cache = {}

	def load_text_model(model_name):
	"""Cargar modelo de texto con soporte para diferentes tipos"""
	if model_name not in model_cache:
	print(f"Cargando modelo de texto: {model_name}")

	# Detectar tipo de modelo
	if "opus-mt" in model_name.lower():
	# Modelo de traducción
	from transformers import MarianMTModel, MarianTokenizer
	tokenizer = MarianTokenizer.from_pretrained(model_name)
	model = MarianMTModel.from_pretrained(model_name)
	else:
	# Modelo de generación de texto
	tokenizer = AutoTokenizer.from_pretrained(model_name)
	model = AutoModelForCausalLM.from_pretrained(model_name)

	# Configurar para chat si es DialoGPT
	if "dialogpt" in model_name.lower():
	tokenizer.pad_token = tokenizer.eos_token
	model.config.pad_token_id = model.config.eos_token_id

	model_cache[model_name] = {
	"tokenizer": tokenizer,
	"model": model,
	"type": "text"
	}

	return model_cache[model_name]

	def load_image_model(model_name):
	"""Cargar modelo de imagen - versión simplificada con soporte para FLUX"""
	if model_name not in model_cache:
	print(f"Cargando modelo de imagen: {model_name}")

	# Configuración especial para FLUX
	if "flux" in model_name.lower():
	try:
	from diffusers import FluxPipeline
	pipe = FluxPipeline.from_pretrained(
	model_name,
	torch_dtype=torch.bfloat16
	)
	pipe.enable_model_cpu_offload()
	except Exception as e:
	print(f"Error cargando FLUX: {e}")
	# Fallback a Stable Diffusion
	pipe = StableDiffusionPipeline.from_pretrained(
	"CompVis/stable-diffusion-v1-4",
	torch_dtype=torch.float32,
	safety_checker=None
	)
	else:
	# Configuración básica para otros modelos
	pipe = StableDiffusionPipeline.from_pretrained(
	model_name,
	torch_dtype=torch.float32,
	safety_checker=None
	)

	# Solo optimización básica de memoria
	pipe.enable_attention_slicing()

	model_cache[model_name] = {
	"pipeline": pipe,
	"type": "image"
	}

	return model_cache[model_name]

	def generate_text(prompt, model_name, max_length=100):
	"""Generar texto con el modelo seleccionado - mejorado para diferentes tipos"""
	try:
	model_data = load_text_model(model_name)
	tokenizer = model_data["tokenizer"]
	model = model_data["model"]

	# Detectar si es modelo de traducción
	if "opus-mt" in model_name.lower():
	# Traducción
	inputs = tokenizer.encode(prompt, return_tensors="pt", max_length=512, truncation=True)
	with torch.no_grad():
	outputs = model.generate(inputs, max_length=max_length, num_beams=4, early_stopping=True)
	response = tokenizer.decode(outputs[0], skip_special_tokens=True)
	else:
	# Generación de texto
	inputs = tokenizer.encode(prompt, return_tensors="pt")

	# Generar
	with torch.no_grad():
	outputs = model.generate(
	inputs,
	max_length=max_length,
	num_return_sequences=1,
	temperature=0.7,
	do_sample=True,
	pad_token_id=tokenizer.eos_token_id
	)

	# Decodificar respuesta
	response = tokenizer.decode(outputs[0], skip_special_tokens=True)

	# Para DialoGPT, extraer solo la respuesta del asistente
	if "dialogpt" in model_name.lower():
	response = response.replace(prompt, "").strip()

	return response

	except Exception as e:
	return f"Error generando texto: {str(e)}"

	def generate_image(prompt, model_name, num_inference_steps=20):
	"""Generar imagen con el modelo seleccionado - versión simplificada con soporte para FLUX"""
	try:
	print(f"Generando imagen con modelo: {model_name}")
	print(f"Prompt: {prompt}")
	print(f"Pasos: {num_inference_steps}")

	model_data = load_image_model(model_name)
	pipeline = model_data["pipeline"]

	# Configuración específica para FLUX
	if "flux" in model_name.lower():
	image = pipeline(
	prompt,
	guidance_scale=0.0,
	num_inference_steps=4, # FLUX usa solo 4 pasos
	max_sequence_length=256,
	generator=torch.Generator("cpu").manual_seed(0)
	).images[0]
	else:
	# Configuración básica para otros modelos
	image = pipeline(
	prompt,
	num_inference_steps=num_inference_steps,
	guidance_scale=7.5
	).images[0]

	print("Imagen generada exitosamente")
	return image

	except Exception as e:
	print(f"Error generando imagen: {str(e)}")
	return f"Error generando imagen: {str(e)}"

	def chat_with_model(message, history, model_name):
	"""Función de chat para DialoGPT con formato de mensajes actualizado"""
	try:
	model_data = load_text_model(model_name)
	tokenizer = model_data["tokenizer"]
	model = model_data["model"]

	# Construir historial de conversación desde el nuevo formato
	conversation = ""
	for msg in history:
	if msg["role"] == "user":
	conversation += f"User: {msg['content']}\n"
	elif msg["role"] == "assistant":
	conversation += f"Assistant: {msg['content']}\n"

	conversation += f"User: {message}\nAssistant:"

	# Generar respuesta
	inputs = tokenizer.encode(conversation, return_tensors="pt", truncation=True, max_length=512)

	with torch.no_grad():
	outputs = model.generate(
	inputs,
	max_length=inputs.shape[1] + 50,
	temperature=0.7,
	do_sample=True,
	pad_token_id=tokenizer.eos_token_id
	)

	response = tokenizer.decode(outputs[0], skip_special_tokens=True)

	# Extraer solo la respuesta del asistente
	response = response.split("Assistant:")[-1].strip()

	# Retornar el historial actualizado con el nuevo formato
	history.append({"role": "user", "content": message})
	history.append({"role": "assistant", "content": response})

	return history

	except Exception as e:
	error_msg = f"Error en el chat: {str(e)}"
	history.append({"role": "user", "content": message})
	history.append({"role": "assistant", "content": error_msg})
	return history

	# Interfaz de Gradio
	with gr.Blocks(title="Modelos Libres de IA", theme=gr.themes.Soft()) as demo:
	gr.Markdown("# 🤖 Modelos Libres de IA")
	gr.Markdown("### Genera texto e imágenes sin límites de cuota")

	with gr.Tabs():
	# Tab de Generación de Texto
	with gr.TabItem("📝 Generación de Texto"):
	with gr.Row():
	with gr.Column():
	text_model = gr.Dropdown(
	choices=list(MODELS["text"].keys()),
	value="microsoft/DialoGPT-medium",
	label="Modelo de Texto"
	)
	text_prompt = gr.Textbox(
	label="Prompt",
	placeholder="Escribe tu prompt aquí...",
	lines=3
	)
	max_length = gr.Slider(
	minimum=50,
	maximum=200,
	value=100,
	step=10,
	label="Longitud máxima"
	)
	text_btn = gr.Button("Generar Texto", variant="primary")

	with gr.Column():
	text_output = gr.Textbox(
	label="Resultado",
	lines=10,
	interactive=False
	)

	text_btn.click(
	generate_text,
	inputs=[text_prompt, text_model, max_length],
	outputs=text_output
	)

	# Tab de Chat
	with gr.TabItem("💬 Chat"):
	with gr.Row():
	with gr.Column():
	chat_model = gr.Dropdown(
	choices=list(MODELS["chat"].keys()),
	value="microsoft/DialoGPT-medium",
	label="Modelo de Chat"
	)

	with gr.Column():
	chatbot = gr.Chatbot(
	label="Chat",
	height=400,
	type="messages"
	)
	chat_input = gr.Textbox(
	label="Mensaje",
	placeholder="Escribe tu mensaje...",
	lines=2
	)
	chat_btn = gr.Button("Enviar", variant="primary")

	chat_btn.click(
	chat_with_model,
	inputs=[chat_input, chatbot, chat_model],
	outputs=[chatbot]
	)

	chat_input.submit(
	chat_with_model,
	inputs=[chat_input, chatbot, chat_model],
	outputs=[chatbot]
	)

	# Tab de Traducción
	with gr.TabItem("🌐 Traducción"):
	with gr.Row():
	with gr.Column():
	translate_model = gr.Dropdown(
	choices=["Helsinki-NLP/opus-mt-es-en", "Helsinki-NLP/opus-mt-en-es"],
	value="Helsinki-NLP/opus-mt-es-en",
	label="Modelo de Traducción"
	)
	translate_text = gr.Textbox(
	label="Texto a traducir",
	placeholder="Escribe el texto que quieres traducir...",
	lines=3
	)
	translate_btn = gr.Button("Traducir", variant="primary")

	with gr.Column():
	translate_output = gr.Textbox(
	label="Traducción",
	lines=3,
	interactive=False
	)

	translate_btn.click(
	generate_text,
	inputs=[translate_text, translate_model, gr.Slider(value=100, visible=False)],
	outputs=translate_output
	)

	# Tab de Generación de Imágenes
	with gr.TabItem("🎨 Generación de Imágenes"):
	with gr.Row():
	with gr.Column():
	image_model = gr.Dropdown(
	choices=list(MODELS["image"].keys()),
	value="CompVis/stable-diffusion-v1-4",
	label="Modelo de Imagen"
	)
	image_prompt = gr.Textbox(
	label="Prompt de Imagen",
	placeholder="Describe la imagen que quieres generar...",
	lines=3
	)
	steps = gr.Slider(
	minimum=10,
	maximum=50,
	value=15,
	step=5,
	label="Pasos de inferencia"
	)
	image_btn = gr.Button("Generar Imagen", variant="primary")

	with gr.Column():
	image_output = gr.Image(
	label="Imagen Generada",
	type="pil"
	)

	image_btn.click(
	generate_image,
	inputs=[image_prompt, image_model, steps],
	outputs=image_output
	)

	# Configuración para Hugging Face Spaces
	if __name__ == "__main__":
	demo.launch(
	server_name="0.0.0.0",
	server_port=7860,
	share=False
	)