SynthScope

Running

App Files Files Community

Ifeanyi committed on Jun 16

Commit

ed356db

verified ·

1 Parent(s): 7f8cddd

Update synthscope.py

Browse files

Files changed (1) hide show

synthscope.py +59 -27

synthscope.py CHANGED Viewed

@@ -15,7 +15,7 @@ google_search_tool = Tool(
 model_id = "gemini-2.0-flash"
-def GoogleSearchImageGen(prompt, image_style, voice):
     def wave_file(filename, pcm, channels=1, rate=24000, sample_width=2):
         with wave.open(filename, "wb") as wf:
             wf.setnchannels(channels)
@@ -23,18 +23,6 @@ def GoogleSearchImageGen(prompt, image_style, voice):
             wf.setframerate(rate)
             wf.writeframes(pcm)
-    # define style-specific prompts
-    style_prompts = {
-        "Comic": f"{prompt}. Convert the search result into a well-crafted text-to-image prompt that generates a comic book-style image.",
-        "Cartoon": f"{prompt}. Convert the search result into a well-crafted text-to-image prompt that generates a cartoon-style image.",
-        "3D": f"{prompt}. Convert the search result into a well-crafted text-to-image prompt that generates a Pixar-style 3D image.",
-        "Anime": f"{prompt}. Convert the search result into a well-crafted text-to-image prompt that generates an Anime-style image.",
-        "Ghibli": f"{prompt}. Convert the search result into a well-crafted text-to-image prompt that generates a Ghibli-style image.",
-        "Victorian": f"{prompt}. Convert the search result into a well-crafted text-to-image prompt that generates a Victorian-era image.",
-        "Movie": f"{prompt}. Convert the search result into a well-crafted text-to-image prompt that generates a Movie-style image.",
-        "Star Wars": f"{prompt}. Convert the search result into a well-crafted text-to-image prompt that generates a Star Wars-style image.",
-        "Marvel": f"{prompt}. Convert the search result into a well-crafted text-to-image prompt that generates a Marvel-style image."
-    }
     # define audio output voice
     select_voice = {
@@ -50,15 +38,6 @@ def GoogleSearchImageGen(prompt, image_style, voice):
         "Gacrux": "Gacrux"
     }
-    # Check if the image_style is supported
-    if image_style in style_prompts:
-        image_gen_prompt = style_prompts[image_style]
-    else:
-        return "Invalid image style", None, None
-    # Initialize variables to avoid UnboundLocalError
-    search_result = ""
-    image = None
     try:
         # Get search result to be displayed to the user
@@ -71,22 +50,75 @@ def GoogleSearchImageGen(prompt, image_style, voice):
             )
         )
         # Extract search result
         for each in response.candidates[0].content.parts:
             if each.text:
                 search_result += each.text
         # Generate audio from search result
         audio_resp = client.models.generate_content(
             model="gemini-2.5-flash-preview-tts",
-            contents=search_result,
             config=types.GenerateContentConfig(
                 response_modalities=["AUDIO"],
                 speech_config=types.SpeechConfig(
                     voice_config=types.VoiceConfig(
                         prebuilt_voice_config=types.PrebuiltVoiceConfig(
-                            voice_name=select_voice[voice],
                         )
                     )
                 ),
@@ -134,6 +166,6 @@ def GoogleSearchImageGen(prompt, image_style, voice):
     except Exception as e:
         print(f"Error occurred: {e}")
         # Return default values in case of error
-        return search_result or "No search result available", None, None
-    return search_result, image, audio_output_file

 model_id = "gemini-2.0-flash"
+def GoogleSearchImageGen(prompt, image_style, voices, language):
     def wave_file(filename, pcm, channels=1, rate=24000, sample_width=2):
         with wave.open(filename, "wb") as wf:
             wf.setnchannels(channels)
             wf.setframerate(rate)
             wf.writeframes(pcm)
     # define audio output voice
     select_voice = {
         "Gacrux": "Gacrux"
     }
     try:
         # Get search result to be displayed to the user
             )
         )
+        # Initialize variables to avoid UnboundLocalError
+        search_result = ""
+        image = None
         # Extract search result
         for each in response.candidates[0].content.parts:
             if each.text:
                 search_result += each.text
+        # define style-specific prompts
+        style_prompts = {
+            "Comic": f"Convert the {search_result} into a well-crafted text-to-image prompt that generates a comic book-style image.",
+            "Cartoon": f"Convert the {search_result} into a well-crafted text-to-image prompt that generates a cartoon-style image.",
+            "3D": f"Convert the {search_result} into a well-crafted text-to-image prompt that generates a Pixar-style 3D image.",
+            "Anime": f"Convert the {search_result} into a well-crafted text-to-image prompt that generates an Anime-style image.",
+            "Ghibli": f"Convert the {search_result} into a well-crafted text-to-image prompt that generates a Ghibli-style image.",
+            "Victorian": f"Convert the {search_result} into a well-crafted text-to-image prompt that generates a Victorian-era image.",
+            "Movie": f"Convert the {search_result} into a well-crafted text-to-image prompt that generates a Movie-style image.",
+            "Star Wars": f"Convert the {search_result} into a well-crafted text-to-image prompt that generates a Star Wars-style image.",
+            "Marvel": f"Convert the {search_result} into a well-crafted text-to-image prompt that generates a Marvel-style image.",
+            "Disney": f"Convert the {search_result} into a well-crafted text-to-image prompt that generates a Disney-style image.",
+            "Van Gogh": f"Convert the {search_result} into a well-crafted text-to-image prompt that generates a Van Gogh-style image.",
+            "Picasso": f"Convert the {search_result} into a well-crafted text-to-image prompt that generates a Picasso-style image"
+        }
+        # Check if the image_style is supported
+        if image_style in style_prompts:
+            image_gen_prompt = style_prompts[image_style]
+        else:
+            return "Invalid image style", None, None
+        # define translation options
+        translation_prompt = {
+            "English": f"Read out the {search_result}",
+            "Spanish": f"Translate {search_result} into Spanish. Return only the translated text.",
+            "French": f"Translate {search_result} into French. Return only the translated text.",
+            "German": f"Translate {search_result} into German. Return only the translated text.",
+            "Italian": f"Translate {search_result} into Italian. Return only the translated text.",
+            "Japanese": f"Translate {search_result} into Japanese. Return only the translated text.",
+            "Tamil": f"Translate {search_result} into Tamil. Return only the translated text.",
+            "Arabic": f"Translate {search_result} into Arabic. Return only the translated text.",
+            "Russian": f"Translate {search_result} into Russian. Return only the translated text.",
+            "Portuguese": f"Translate {search_result} Portuguese. Return only the translated text.",
+            "Dutch": f"Translate {search_result} into Dutch. Return only the translated text.",
+            "Thai": f"Translate {search_result} into Thai. Return only the translated text.",
+            "Turkish": f"Translate {search_result} into Turkish. Return only the translated text.",
+            "Romanian": f"Translate {search_result} into Romanian. Return only the translated text.",
+            "Polish": f"Translate {search_result} into Romanian. Return only the translated text."
+        }
+        # updated search result
+        trans_resp = client.models.generate_content(
+            model=model_id,
+            contents= translation_prompt[language]
+        )
         # Generate audio from search result
         audio_resp = client.models.generate_content(
             model="gemini-2.5-flash-preview-tts",
+            contents=trans_resp.text,
             config=types.GenerateContentConfig(
                 response_modalities=["AUDIO"],
                 speech_config=types.SpeechConfig(
                     voice_config=types.VoiceConfig(
                         prebuilt_voice_config=types.PrebuiltVoiceConfig(
+                            voice_name=select_voice[voices],
                         )
                     )
                 ),
     except Exception as e:
         print(f"Error occurred: {e}")
         # Return default values in case of error
+        return trans_resp.text or "No search result available", None, None
+    return trans_resp.text, image, audio_output_file