Spaces:

warshanks
/

seinfeld

Sleeping

File size: 12,247 Bytes

import gradio as gr
import asyncio
import threading
import os
from io import BytesIO
from dotenv import load_dotenv
from google import genai
from google.genai.types import Part, FileData, Tool, GenerateContentConfig, GoogleSearch, Content

# Import Discord functionality
import discord
from discord import app_commands
from discord.ext import commands

load_dotenv()

# Environment variables
GOOGLE_KEY = os.getenv("GOOGLE_KEY")
DISCORD_TOKEN = os.getenv("DISCORD_TOKEN")
CHANNEL_ID = os.getenv("CHANNEL_ID")
ADDITIONAL_CHANNELS = os.getenv("ADDITIONAL_CHANNELS", "")

# Parse channel IDs for Discord bot
TARGET_CHANNEL_IDS = []
if CHANNEL_ID:
    TARGET_CHANNEL_IDS.append(int(CHANNEL_ID))
if ADDITIONAL_CHANNELS:
    ADDITIONAL_IDS = [int(channel_id.strip()) for channel_id in ADDITIONAL_CHANNELS.split(",") if channel_id.strip()]
    TARGET_CHANNEL_IDS.extend(ADDITIONAL_IDS)

# Model configuration - centralized model definitions
MODEL_DEFINITIONS = {
    "flash": "gemini-2.0-flash",
    "pro": "gemini-2.5-pro-preview-05-06",
    "image": "imagen-3.0-generate-002"
}

# Default models
chat_model_id = MODEL_DEFINITIONS["flash"]  # Default to flash model
image_model_id = MODEL_DEFINITIONS["image"]

# Initialize Google client
google_client = None
if GOOGLE_KEY:
    google_client = genai.Client(api_key=GOOGLE_KEY)

# Default system instruction (fallback if environment variable not set)
DEFAULT_SYSTEM_INSTRUCTION = ""

# Get system instruction from environment variable or use default
SYSTEM_INSTRUCTION = os.getenv("SYSTEM_INSTRUCTION", DEFAULT_SYSTEM_INSTRUCTION)

def respond_with_gemini(message, history):
    """Generate response using Google Gemini API with Seinfeld personality"""
    if not google_client:
        return "I need a Google API key to work! Set the GOOGLE_KEY environment variable."

    try:
        # Format history for Gemini API
        formatted_history = []
        for user_msg, assistant_msg in history:
            if user_msg:
                formatted_history.append(Content(role="user", parts=[Part(text=user_msg)]))
            if assistant_msg:
                formatted_history.append(Content(role="model", parts=[Part(text=assistant_msg)]))

        # Initialize Google Search tool
        google_search_tool = Tool(google_search=GoogleSearch())

        # Create chat
        chat = google_client.chats.create(
            model=chat_model_id,
            history=formatted_history,
            config=GenerateContentConfig(
                system_instruction=SYSTEM_INSTRUCTION,
                tools=[google_search_tool],
                response_modalities=["TEXT"]
            )
        )

        # Send message and get response
        response = chat.send_message(message)
        return response.text

    except Exception as e:
        print(f"Error with Gemini API: {e}")
        # Fallback to a Seinfeld-style response
        return f"What's the deal with API errors? I mean, you type something in, the computer thinks about it, and then... nothing! It's like asking your friend a question and they just stare at you. 'Hey, how are you?' *silence* 'Hello?' *more silence* It's the digital equivalent of being ignored at a party!"

def respond_gradio(message, history: list[tuple[str, str]]):
    """Response function for Gradio interface"""
    # Use Gemini with Seinfeld personality and default parameters
    response = respond_with_gemini(message, history)

    # Stream the response character by character for better UX
    partial_response = ""
    for char in response:
        partial_response += char
        yield partial_response

async def keep_typing(channel):
    """Continuously show the typing indicator until the task is cancelled."""
    print(f"Starting typing indicator in channel {channel.id}")
    try:
        while True:
            async with channel.typing():
                await asyncio.sleep(5)
    except asyncio.CancelledError:
        print(f"Typing indicator cancelled for channel {channel.id}")
        pass
    except Exception as e:
        print(f"Error in keep_typing: {type(e).__name__}: {str(e)}")

async def generate_image_bytes(prompt, google_client, image_model_id):
    """Generate an image using Gemini API and return the image bytes."""
    try:
        # Run image generation in a separate thread to avoid blocking the event loop
        def generate_image():
            response = google_client.models.generate_images(
                model=image_model_id,
                prompt=prompt,
                config=genai.types.GenerateImagesConfig(
                    number_of_images=1,
                    aspect_ratio="16:9"
                )
            )
            return response

        # Run the API call in a separate thread
        response = await asyncio.to_thread(generate_image)

        # Return the image bytes directly
        for generated_image in response.generated_images:
            return generated_image.image.image_bytes

        # If we get here, no images were generated
        print("ERROR: No images were generated in the response")
        raise Exception("No image was generated in the response")
    except Exception as e:
        print(f"Exception in image generation: {type(e).__name__}: {str(e)}")
        raise

async def handle_image_request(message, query, google_client, image_model_id):
    """Handle image generation requests from text messages."""
    if query.lower().startswith("generate image:") or query.lower().startswith("create image:"):
        # Start continuous typing in the background
        typing_task = asyncio.create_task(keep_typing(message.channel))

        try:
            prompt = query.split(":", 1)[1].strip()
            try:
                print(f"Generating image for prompt: {prompt[:30]}...")
                image_bytes = await generate_image_bytes(prompt, google_client, image_model_id)
                # Cancel typing before sending the response
                typing_task.cancel()
                # Send image directly from bytes without saving to disk
                await message.reply(f"Here's your image:", file=discord.File(BytesIO(image_bytes), filename="generated_image.png"))
            except Exception as e:
                print(f"Error generating image: {e}")
                # Cancel typing before sending the response
                typing_task.cancel()
                await message.reply("Sorry, I couldn't generate that image.")
        except Exception as e:
            # Make sure to cancel the typing task even if an error occurs
            typing_task.cancel()
            print(f"Exception during image generation: {e}")
            raise e
        return True
    return False

# Discord Bot Setup
discord_bot = None

async def setup_discord_bot():
    """Setup and run Discord bot"""
    if not DISCORD_TOKEN or not TARGET_CHANNEL_IDS:
        print("Discord bot disabled: Missing DISCORD_TOKEN or channel IDs")
        return

    global discord_bot

    # Initialize Discord bot
    intents = discord.Intents.default()
    intents.message_content = True
    discord_bot = commands.Bot(command_prefix="~", intents=intents)

    @discord_bot.event
    async def on_ready():
        print(f"Discord bot logged in as {discord_bot.user}")
        try:
            synced = await discord_bot.tree.sync()
            print(f"Synced {len(synced)} command(s)")
        except Exception as e:
            print(f"Failed to sync commands: {e}")

    @discord_bot.event
    async def on_message(message):
        await discord_bot.process_commands(message)

        if message.channel.id in TARGET_CHANNEL_IDS:
            if message.author == discord_bot.user:
                return
            if message.content.startswith('!') or message.content.startswith('~'):
                return
            if message.content.strip() == "":
                return

            # Check if this is an image generation request first
            if await handle_image_request(message, message.content, google_client, image_model_id):
                return

            # Show typing indicator
            async with message.channel.typing():
                # Get response using the same function as Gradio
                response = respond_with_gemini(message.content, [])

                # Split long responses
                if len(response) > 2000:
                    # Split by sentences to preserve formatting
                    sentences = response.split('. ')
                    current_msg = ""

                    for sentence in sentences:
                        if len(current_msg + sentence + '. ') > 1900:
                            if current_msg:
                                await message.reply(current_msg.strip())
                                current_msg = sentence + '. '
                            else:
                                # Single sentence too long, just send it
                                await message.reply(sentence[:1900] + "...")
                                current_msg = ""
                        else:
                            current_msg += sentence + '. '

                    if current_msg:
                        await message.channel.send(current_msg.strip())
                else:
                    await message.reply(response)

    @discord_bot.tree.command(name="model")
    @app_commands.describe(new_model_id="New model ID to use for Gemini API or shorthand ('flash', 'pro')")
    async def change_model(interaction: discord.Interaction, new_model_id: str):
        """Changes the Gemini chat model being used."""
        if not interaction.user.guild_permissions.administrator:
            await interaction.response.send_message("Only administrators can change the model.", ephemeral=True)
            return

        global chat_model_id

        # Use centralized model definitions
        actual_model_id = MODEL_DEFINITIONS.get(new_model_id.lower(), new_model_id)
        old_model = chat_model_id
        chat_model_id = actual_model_id

        await interaction.response.send_message(f"Chat model changed from `{old_model}` to `{actual_model_id}`", ephemeral=True)

    @discord_bot.tree.command(name="image")
    @app_commands.describe(prompt="Description of the image you want to generate")
    async def generate_image_command(interaction: discord.Interaction, prompt: str):
        """Generates an image using Gemini API based on the provided prompt."""
        await interaction.response.defer(thinking=True)

        try:
            image_bytes = await generate_image_bytes(prompt, google_client, image_model_id)
            await interaction.followup.send(f"Generated image based on: {prompt}", file=discord.File(BytesIO(image_bytes), filename="generated_image.png"))
        except Exception as e:
            print(f"Error generating image: {e}")
            await interaction.followup.send("Sorry, I couldn't generate that image.")

    # Run the bot
    await discord_bot.start(DISCORD_TOKEN)

def run_discord_bot():
    """Run Discord bot in separate thread"""
    try:
        asyncio.run(setup_discord_bot())
    except Exception as e:
        print(f"Discord bot error: {e}")

# Create Gradio interface
demo = gr.ChatInterface(
    respond_gradio,
    title="🥨 Seinfeld Chatbot",
    description="Chat with Jerry Seinfeld! What's the deal with chatbots anyway?",
    examples=[
        ["What's the deal with airplane food?"],
        ["Why do people say 'after dark' when it's really after light?"],
        ["What's up with people who take forever to order at restaurants?"],
        ["Why do we park in driveways and drive on parkways?"],
        ["Tell me about the soup nazi"],
        ["What's your take on people who don't return shopping carts?"],
    ],
    cache_examples=True,
)

if __name__ == "__main__":
    # Start Discord bot in separate thread if credentials are available
    if DISCORD_TOKEN and TARGET_CHANNEL_IDS:
        discord_thread = threading.Thread(target=run_discord_bot, daemon=True)
        discord_thread.start()
        print("Discord bot starting in background...")
    else:
        print("Discord bot disabled: Missing credentials or channel IDs")

    # Launch Gradio interface
    demo.launch()