# wonderlore / app.py
# Last commit by GH111: "Update app.py" (7ac2f8c), 3.31 kB
# Import libraries
import os
import tempfile
from io import BytesIO

import gradio as gr
import openai
from diffusers import DiffusionPipeline
from gtts import gTTS
from PIL import Image
# Set your OpenAI API key.
# Read it from the OPENAI_API_KEY environment variable so the secret does not
# have to be committed; the placeholder is kept as a fallback for local edits.
openai.api_key = os.environ.get("OPENAI_API_KEY", "YOUR_OPENAI_API_KEY")

# Use a DiffusionPipeline for text-to-image.
# The checkpoint must be a text-to-image model: the previously configured
# "stabilityai/stable-video-diffusion-img2vid-xt" is an image-to-video model
# and cannot be driven by a text prompt.
image_generation_pipe = DiffusionPipeline.from_pretrained(
    "stabilityai/stable-diffusion-xl-base-1.0"
)

# Set the context for the storyteller.
# NOTE: this list is module-level, so it is shared by every request served by
# this process and grows with each generated story.
messages = [
    {
        "role": "system",
        "content": "You are a magical storyteller, creating wonderful tales for kids. Make them imaginative and full of joy!",
    }
]

# Initialize page number (index into the pages of the most recent story).
current_page = 0
# Define the Storyteller function
def StorytellerGPT(character, child_name, lesson_choice, tell_story, _):
    """Generate a story page, its spoken narration, and an illustration.

    Args:
        character: Character the child meets in the story.
        child_name: Name of the child, used as the protagonist.
        lesson_choice: Theme the story should teach.
        tell_story: Opening text the story continues from; ``None`` is
            treated as an empty string.
        _: Value supplied by the "Next Page" button input; unused.

    Returns:
        A ``(page_text, audio_path, image)`` tuple: the text of the current
        page, the path of an MP3 file narrating the whole story (``None`` if
        the model returned no text), and the generated illustration (``None``
        if the model returned no text).
    """
    global current_page

    # Gradio may pass None for an untouched textbox; keep concatenation safe.
    tell_story = tell_story or ""

    # Set the characters and lesson based on user choices
    character_info = f"Once upon a time, {child_name} met {character}. "
    lesson_info = f"Today's lesson is about {lesson_choice}. "
    messages.append({"role": "user", "content": tell_story})

    # Generate story using OpenAI's completions endpoint.
    # "text-davinci-003" has been retired; "gpt-3.5-turbo-instruct" is its
    # replacement on the same endpoint.
    input_text = character_info + lesson_info + tell_story
    completion = openai.Completion.create(
        model="gpt-3.5-turbo-instruct",
        prompt=input_text,
        max_tokens=150,
        n=1,
        stop=None,
    )
    # Completions commonly begin with blank lines; strip them so the first
    # "page" is not an empty string.
    story_reply = completion["choices"][0]["text"].strip()
    messages.append({"role": "assistant", "content": story_reply})

    audio_path = None
    image_reply = None
    if story_reply:
        # Convert text to speech with gTTS (no API key is required).
        # The MP3 is written to a temporary file because Gradio's "audio"
        # output expects a file path rather than raw bytes.
        tts = gTTS(text=story_reply, lang="en", slow=False)
        with tempfile.NamedTemporaryFile(suffix=".mp3", delete=False) as audio_file:
            tts.write_to_fp(audio_file)
        audio_path = audio_file.name

        # Convert text to image using DiffusionPipeline; the pipeline returns
        # an output object whose `.images` list holds the PIL images.
        image_reply = image_generation_pipe(story_reply).images[0]

    # Display the story on separate pages (paragraphs separated by blank lines).
    story_pages = [
        page.strip() for page in story_reply.split("\n\n") if page.strip()
    ] or [""]
    # Ensure the current_page is within bounds.
    # NOTE(review): nothing in this file ever advances current_page, so the
    # first page is always shown — confirm the intended "Next Page" behaviour.
    current_page = min(current_page, len(story_pages) - 1)

    return story_pages[current_page], audio_path, image_reply
# Create the Gradio Interface with styling.
# Inputs are passed to StorytellerGPT positionally, so their order must match
# its signature: (character, child_name, lesson_choice, tell_story, _).
demo = gr.Interface(
    fn=StorytellerGPT,
    inputs=[
        gr.Dropdown(["unicorn", "dragon", "wizard"], label="Choose a Character"),
        # The first positional argument of Textbox is its initial value, so it
        # is omitted to avoid pre-filling the box with the literal "text".
        gr.Textbox(label="Child's Name"),
        gr.Dropdown(["kindness", "creativity", "bravery"], label="Choose a Lesson"),
        gr.Textbox(label="Start the Story with"),
        gr.Button("Next Page"),
    ],
    outputs=["text", "audio", "image"],
    title="📖 Storytelling Magic",
    description="A magical storyteller app for kids! Choose characters, add your name, and select the lesson you want to learn.",
    # live=True would re-run the whole pipeline (OpenAI call, text-to-speech,
    # image generation) on every input change; run only on explicit submit.
    live=False,
    css="""body {
background-image: url('https://www.bing.com/images/create/a-castle-ai-metaverse-style/1-657576205c7146f2b7f2f8d1c552810f?id=dZs6kpD2HfmH4eojx%2bHjdA%3d%3d&view=detailv2&idpp=genimg&FORM=GCRIDP&mode=overlay');
background-size: cover;
background-position: center;
font-family: 'Comic Sans MS', cursive, sans-serif; /* Optional: Change the font */
}""",
)

# Launch the Gradio Interface
demo.launch()