evalstate committed
Commit 7c163af · 1 Parent(s): 5b0cdfc

update sizes, remove unused checkbox, update description, change inference default steps

Files changed (1): app.py +14 -38
app.py CHANGED
@@ -19,44 +19,28 @@ pipe = QwenImagePipeline.from_pretrained("Qwen/Qwen-Image", torch_dtype=dtype).t
 # --- UI Constants and Helpers ---
 MAX_SEED = np.iinfo(np.int32).max
 
-def ensure_divisible_by_16(value):
-    """Ensures a value is divisible by 16 by rounding to nearest multiple."""
-    return (value + 8) // 16 * 16
-
 def get_image_size(aspect_ratio):
     """Converts aspect ratio string to width, height tuple."""
-    # Handle 16:9 size variants
-    if aspect_ratio == "16:9_large":
-        return 1664, 928
-    elif aspect_ratio == "16:9_three_quarter":
-        # 75% of full size, ensuring divisibility by 16
-        width = ensure_divisible_by_16(int(1664 * 0.75))
-        height = ensure_divisible_by_16(int(928 * 0.75))
-        return width, height  # 1248, 704
-    elif aspect_ratio == "16:9_half":
-        # 50% of full size
-        return 832, 464
-    # Keep original aspect ratios as fallback
-    elif aspect_ratio == "1:1":
-        return 664, 664
+    if aspect_ratio == "1:1":
+        return 1328, 1328
     elif aspect_ratio == "16:9":
-        return 832, 464
+        return 1664, 928
     elif aspect_ratio == "9:16":
-        return 464, 832
+        return 928, 1664
     elif aspect_ratio == "4:3":
-        return 736, 552
+        return 1472, 1104
     elif aspect_ratio == "3:4":
-        return 552, 736
+        return 1104, 1472
     elif aspect_ratio == "3:2":
-        return 792, 528
+        return 1584, 1056
     elif aspect_ratio == "2:3":
-        return 528, 792
+        return 1056, 1584
     else:
-        # Default to 16:9_half if something goes wrong
-        return 832, 464
+        # Default to 1:1 if something goes wrong
+        return 1328, 1328
 
 # --- Main Inference Function ---
-@spaces.GPU(duration=90)
+@spaces.GPU(duration=40)
 def generate_image(
     prompt,
     seed=42,
@@ -65,7 +49,6 @@ def generate_image(
     negative_prompt="text, watermark, copyright, blurry, low resolution",
     guidance_scale=4.0,
     num_inference_steps=30,
-    # prompt_enhance=True,
     progress=gr.Progress(track_tqdm=True),
 ):
     """
@@ -86,11 +69,7 @@ def generate_image(
 
     # Set up the generator for reproducibility
     generator = torch.Generator(device=device).manual_seed(seed)
-    # magic_prompt = "Ultra HD, 4K, cinematic composition"
-    # prompt = prompt + " " + magic_prompt
     print(f"Calling pipeline with prompt: '{prompt}'")
-    # if prompt_enhance:
-    #     prompt = rewrite(prompt)
     print(f"Actual Prompt: '{prompt}'")
     print(f"Negative Prompt: '{negative_prompt}'")
     print(f"Seed: {seed}, Size: {width}x{height}, Steps: {num_inference_steps}, Guidance: {guidance_scale}")
@@ -132,16 +111,14 @@ css = """
 with gr.Blocks(css=css) as demo:
     with gr.Column(elem_id="col-container"):
         gr.Markdown('<img src="https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen-Image/qwen_image_logo.png" alt="Qwen-Image Logo" width="400" style="display: block; margin: 0 auto;">')
-        gr.Markdown("[Learn more](https://github.com/QwenLM/Qwen-Image) about the Qwen-Image series. Try on [Qwen Chat](https://chat.qwen.ai/), or [download model](https://huggingface.co/Qwen/Qwen-Image) to run locally with ComfyUI or diffusers. <br /> **This version does not run the prompt polisher, but does suffix the 'Magic Prompt' and improve parameter descriptions**.")
+        gr.Markdown("[Learn more](https://github.com/QwenLM/Qwen-Image) about the Qwen-Image series. Try on [Qwen Chat](https://chat.qwen.ai/), or [download model](https://huggingface.co/Qwen/Qwen-Image) to run locally with ComfyUI or diffusers. <br /> **This version does not include the 'prompt polisher', and uses 20 inference steps by default to target ~30s generation times**.")
         with gr.Row():
             prompt = gr.Text(
                 label="Prompt",
                 show_label=False,
                 placeholder="Enter your prompt",
                 container=False,
-            )
-
-
+            )
             run_button = gr.Button("Run", scale=0, variant="primary")
 
         result = gr.Image(label="Result", show_label=False, type="pil")
@@ -170,7 +147,6 @@ with gr.Blocks(css=css) as demo:
                     choices=["16:9_large", "16:9_three_quarter", "16:9_half"],
                     value="16:9_half",
                 )
-                prompt_enhance = gr.Checkbox(label="Prompt Enhance", value=True)
 
             with gr.Row():
                 guidance_scale = gr.Slider(
@@ -186,7 +162,7 @@ with gr.Blocks(css=css) as demo:
                     minimum=1,
                     maximum=50,
                     step=1,
-                    value=30,
+                    value=20,
                 )
 
         gr.Examples(examples=examples, inputs=[prompt], outputs=[result, seed], fn=generate_image, cache_examples=False)
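Net effect of the commit, as a minimal sketch: the aspect-ratio presets now map to the full-resolution Qwen-Image sizes (e.g. "16:9" returns 1664x928 where it previously returned 832x464), and the default step count drops from 30 to 20 to fit the reduced @spaces.GPU(duration=40) budget. The pipeline call below is an assumption based on the standard diffusers text-to-image interface; the exact keyword arguments used in app.py are not shown in this diff.

```python
# Sketch only: mirrors the new get_image_size() table and the 20-step default.
# The pipe(...) keyword arguments are an assumption (standard diffusers
# text-to-image interface), not copied verbatim from app.py.
import torch
from diffusers import DiffusionPipeline

ASPECT_SIZES = {
    "1:1": (1328, 1328),
    "16:9": (1664, 928),
    "9:16": (928, 1664),
    "4:3": (1472, 1104),
    "3:4": (1104, 1472),
    "3:2": (1584, 1056),
    "2:3": (1056, 1584),
}

def get_image_size(aspect_ratio: str) -> tuple[int, int]:
    # Falls back to 1:1, matching the new default branch in the diff.
    return ASPECT_SIZES.get(aspect_ratio, (1328, 1328))

if __name__ == "__main__":
    device = "cuda" if torch.cuda.is_available() else "cpu"
    pipe = DiffusionPipeline.from_pretrained(
        "Qwen/Qwen-Image", torch_dtype=torch.bfloat16
    ).to(device)

    width, height = get_image_size("16:9")  # -> (1664, 928)
    generator = torch.Generator(device=device).manual_seed(42)
    image = pipe(
        prompt="a capybara reading a newspaper",
        negative_prompt="text, watermark, copyright, blurry, low resolution",
        width=width,
        height=height,
        num_inference_steps=20,  # new default introduced by this commit
        generator=generator,
    ).images[0]
    image.save("qwen_image_demo.png")
```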