Image2Network

Sleeping

App Files Files Community

Ifeanyi committed on May 11

Commit

edf6410

verified ·

1 Parent(s): 3315de8

Update app.py

Browse files

Files changed (1) hide show

app.py +52 -41

app.py CHANGED Viewed

@@ -1,46 +1,57 @@
-import google.generativeai as genai
-from typing import Union, IO
-import gradio as gr
-import numpy as np
-import PIL.Image
 import os
-api_key = os.getenv("GEMINI_API_KEY")
-genai.configure(api_key = api_key)
-def ImageStory(image: Union[np.ndarray, str, IO]) -> str:
-    """
-    Writes a short story about the uploaded image.
-    Args:
-        image: The image being uploaded. It can be a NumPy array, file path, or file-like object.
-    Returns:
-        A short story about the uploaded image.
-    """
-    # load model
-    model = genai.GenerativeModel("gemini-1.5-flash")
-    # check image file and convert to a PIL image
-    if isinstance(image, np.ndarray):
-        img = PIL.Image.fromarray(image)
-    else:
-        img = PIL.Image.open(image)
-    response = model.generate_content(["write a short story about the image", img])
-    return response.text
-app = gr.Interface(ImageStory,
-                   inputs = gr.Image(label = "Image"),
-                   outputs = gr.Text(label = "Story"),
-                   examples = ["rubiks cube.jpg", "giraffe.jpg", "street.jpg"],
-                   title = "Image To Story",
-                   theme = "patrickosornio/my_theme1")
 if __name__ == "__main__":
     app.launch(mcp_server = True)

+import base64
+from io import BytesIO
 import os
+import gradio as gr
+from google import genai
+from google.genai import types
+from PIL import Image
+def generate_image(prompt):
+  """
+  Transforms text into an image.
+  Args:
+      prompt: A natural language instruction that is used to generate an image.
+  Returns:
+        An image.
+  """
+  api_key = os.getenv("GEMINI_API_KEY")
+  client = genai.Client(api_key=api_key)
+  prompt = tuple(prompt)
+  response = client.models.generate_content(
+    model="gemini-2.0-flash-preview-image-generation",
+    contents=prompt,
+    config=types
+    .GenerateContentConfig(
+      response_modalities=['TEXT', 'IMAGE']
+    )
+  )
+  for part in response.candidates[0].content.parts:
+    if part.text is not None:
+      pass
+    elif part.inline_data is not None:
+      image = Image.open(BytesIO((part.inline_data.data)))
+      # image.save('gemini-native-image.png')
+      # display(image)
+  return image
+# build gradio interface
+app = gr.Interface(fn = generate_image,
+                   inputs = gr.Text(label="Prompt",placeholder="Type your prompt here. . ."),
+                   outputs = gr.Image(label="Generated Image"),
+                   title="Gemini Image Generator",
+                   examples=["A 3D rendering of a little black girl wearing a colorful dress and smiling broadly at the camera",
+                             "Disney and Pixar-style playful bunny skipping about in a garden full of carrots and lettuce",
+                             "A black female superhero with braided hair flying over a over an active volcano with a fiery red sky",
+                             "A black jazz musician playing his saxophone and surrounded by colorful musical notes."])
+# Launch the app only when this file is run as a script (not when imported);
+# launch() is called with mcp_server=True.
 if __name__ == "__main__":
     app.launch(mcp_server = True)