Spaces:

mcp-tools
/

Qwen-Image

Running on Zero

App Files Community

evalstate committed on 5 days ago

Commit

8c9766e

1 Parent(s): ac783de

add size options for output testing

Browse files

Files changed (1) hide show

app.py +24 -8

app.py CHANGED Viewed

@@ -19,9 +19,25 @@ pipe = QwenImagePipeline.from_pretrained("Qwen/Qwen-Image", torch_dtype=dtype).t
 # --- UI Constants and Helpers ---
 MAX_SEED = np.iinfo(np.int32).max
 def get_image_size(aspect_ratio):
     """Converts aspect ratio string to width, height tuple."""
-    if aspect_ratio == "1:1":
         return 664, 664
     elif aspect_ratio == "16:9":
         return 832, 464
@@ -36,8 +52,8 @@ def get_image_size(aspect_ratio):
     elif aspect_ratio == "2:3":
         return 528, 792
     else:
-        # Default to 1:1 if something goes wrong
-        return 664, 664
 # --- Main Inference Function ---
 @spaces.GPU(duration=30)
@@ -70,8 +86,8 @@ def generate_image(
     # Set up the generator for reproducibility
     generator = torch.Generator(device=device).manual_seed(seed)
-    magic_prompt = "Ultra HD, 4K, cinematic composition"
-    prompt = prompt + " " + magic_prompt
     print(f"Calling pipeline with prompt: '{prompt}'")
 #    if prompt_enhance:
  #       prompt = rewrite(prompt)
@@ -150,9 +166,9 @@ with gr.Blocks(css=css) as demo:
             with gr.Row():
                 aspect_ratio = gr.Radio(
-                    label="Aspect ratio (width:height)",
-                    choices=["1:1", "16:9", "9:16", "4:3", "3:4", "3:2", "2:3"],
-                    value="16:9",
                 )
                 prompt_enhance = gr.Checkbox(label="Prompt Enhance", value=True)

 # --- UI Constants and Helpers ---
 MAX_SEED = np.iinfo(np.int32).max
+def ensure_divisible_by_16(value):
+    """Ensures a value is divisible by 16 by rounding to nearest multiple."""
+    return (value + 8) // 16 * 16
 def get_image_size(aspect_ratio):
     """Converts aspect ratio string to width, height tuple."""
+    # Handle 16:9 size variants
+    if aspect_ratio == "16:9_large":
+        return 1664, 928
+    elif aspect_ratio == "16:9_three_quarter":
+        # 75% of full size, ensuring divisibility by 16
+        width = ensure_divisible_by_16(int(1664 * 0.75))
+        height = ensure_divisible_by_16(int(928 * 0.75))
+        return width, height  # 1248, 704
+    elif aspect_ratio == "16:9_half":
+        # 50% of full size
+        return 832, 464
+    # Keep original aspect ratios as fallback
+    elif aspect_ratio == "1:1":
         return 664, 664
     elif aspect_ratio == "16:9":
         return 832, 464
     elif aspect_ratio == "2:3":
         return 528, 792
     else:
+        # Default to 16:9_half if something goes wrong
+        return 832, 464
 # --- Main Inference Function ---
 @spaces.GPU(duration=30)
     # Set up the generator for reproducibility
     generator = torch.Generator(device=device).manual_seed(seed)
+#    magic_prompt = "Ultra HD, 4K, cinematic composition"
+ #   prompt = prompt + " " + magic_prompt
     print(f"Calling pipeline with prompt: '{prompt}'")
 #    if prompt_enhance:
  #       prompt = rewrite(prompt)
             with gr.Row():
                 aspect_ratio = gr.Radio(
+                    label="Image Size (16:9 aspect ratio)",
+                    choices=["16:9_large", "16:9_three_quarter", "16:9_half"],
+                    value="16:9_half",
                 )
                 prompt_enhance = gr.Checkbox(label="Prompt Enhance", value=True)