szeandlink/Project_Testing

Sleeping

App Files Community

Szeyu committed on May 2

Commit

890cd41

verified ·

1 Parent(s): fc42b63

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -14

app.py CHANGED Viewed

@@ -22,12 +22,18 @@ captioner, storyer, tts = load_pipelines()
 def clean_generated_story(raw_story: str) -> str:
     """
     Cleans the generated story by:
-    1. Removing digits.
-    2. Removing words that are likely random letter combinations based on having no vowels.
-    3. Removing single-letter words unless they are allowed (such as 'a' or 'I').
     """
-    # Remove all digits using regex
-    story_without_numbers = re.sub(r'\d+', '', raw_story)
     vowels = set('aeiouAEIOU')
@@ -40,11 +46,11 @@ def clean_generated_story(raw_story: str) -> str:
             return False
         return True
-    # Split the story into words, apply filtering, and recombine into a clean story
     words = story_without_numbers.split()
     filtered_words = [word for word in words if is_valid_word(word)]
-    # Optionally, you can trim the clean story to a certain word count
     clean_story = " ".join(filtered_words[:100])
     return clean_story
@@ -63,8 +69,7 @@ def get_story(caption: str) -> str:
     Takes a caption and returns a funny, bright, and playful story targeted toward young children.
     """
     prompt = (
-        f"Write a funny and playful story for young children"
-        f"precisely centered on this scene {caption}\nStory:"
         f"mention the exact place, location or venue within {caption}. "
         f"Make the story magical and exciting."
     )
@@ -85,12 +90,12 @@ def get_story(caption: str) -> str:
 def generate_audio(story: str) -> str:
     """
-    Converts a text story into speech audio and returns the file path for the audio.
     """
     chunks = textwrap.wrap(story, width=200)
     audio = np.concatenate([tts(chunk)["audio"].squeeze() for chunk in chunks])
-    # Save audio to a temporary file
     with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as temp_file:
         sf.write(temp_file.name, audio, tts.model.config.sampling_rate)
         temp_file_path = temp_file.name
@@ -98,8 +103,10 @@ def generate_audio(story: str) -> str:
 def generate_content(image):
     """
-    Pipeline that takes an image, generates a caption, a story based on that caption,
-    and produces an audio file from the story.
     """
     caption = get_caption(image)
     story = get_story(caption)
@@ -125,4 +132,4 @@ if st.button("✨ Make My Story! ✨"):
             st.audio(audio_path, format="audio/wav")
             os.remove(audio_path)
     else:
-        st.warning("Please upload a picture first! 📸")

 def clean_generated_story(raw_story: str) -> str:
     """
     Cleans the generated story by:
+    1. Removing URLs.
+    2. Removing digits.
+    3. Removing words likely to be random letter combinations based on having no vowels.
+    4. Removing single-letter words unless allowed (such as 'a' or 'I').
     """
+    # Remove URLs starting with http://, https://, or www.
+    no_urls = re.sub(r'\b(?:https?://|www\.)\S+\b', '', raw_story)
+    # Remove domain names without protocol (e.g., erskybooks.com)
+    no_urls = re.sub(r'\b\w+\.(com|net|org|co\.uk|ca\.us|me)\b', '', no_urls)
+    # Remove all digits
+    story_without_numbers = re.sub(r'\d+', '', no_urls)
     vowels = set('aeiouAEIOU')
             return False
         return True
+    # Split the cleaned text into words, filter them, and reassemble
     words = story_without_numbers.split()
     filtered_words = [word for word in words if is_valid_word(word)]
+    # Trim the cleaned story to the first 100 words (optional)
     clean_story = " ".join(filtered_words[:100])
     return clean_story
     Takes a caption and returns a funny, bright, and playful story targeted toward young children.
     """
     prompt = (
+        f"Write a funny and playful story for young children precisely centered on this scene {caption}\nStory: "
         f"mention the exact place, location or venue within {caption}. "
         f"Make the story magical and exciting."
     )
 def generate_audio(story: str) -> str:
     """
+    Converts the text story into speech audio and returns the file path for the audio.
     """
     chunks = textwrap.wrap(story, width=200)
     audio = np.concatenate([tts(chunk)["audio"].squeeze() for chunk in chunks])
+    # Save the audio to a temporary file and return its path.
     with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as temp_file:
         sf.write(temp_file.name, audio, tts.model.config.sampling_rate)
         temp_file_path = temp_file.name
 def generate_content(image):
     """
+    Pipeline function that:
+    - Generates a caption from the uploaded image.
+    - Uses the caption to generate a story.
+    - Converts the story to speech audio.
     """
     caption = get_caption(image)
     story = get_story(caption)
             st.audio(audio_path, format="audio/wav")
             os.remove(audio_path)
     else:
+        st.warning("Please upload a picture first! 📸")