Commit b28f99d (verified) · 1 Parent(s): 54731a8
huangrh9 committed

Update app.py

Files changed (1): app.py (+10 −8)
app.py CHANGED
@@ -21,7 +21,8 @@ logging.getLogger("httpx").setLevel(logging.WARNING)
 
 import gradio as gr
 
-from conversation import default_conversation, conv_templates, SeparatorStyle
+from illume.conversation import default_conversation, conv_templates, SeparatorStyle
+# from conversation import default_conversation, conv_templates, SeparatorStyle
 
 # --- Global Variables and Model Loading ---
 model = None # Global variable to hold the loaded ILLUME model
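The import now resolves conversation.py from inside the illume package, with the old top-level import kept only as a comment. If one wanted to tolerate both layouts instead of hard-coding the new path, a minimal sketch could look like this (an assumption for illustration, not what the commit does):

try:
    # New layout: conversation.py lives inside the illume package.
    from illume.conversation import default_conversation, conv_templates, SeparatorStyle
except ImportError:
    # Old layout: conversation.py at the repository root.
    from conversation import default_conversation, conv_templates, SeparatorStyle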
@@ -569,8 +570,9 @@ title_markdown = """
 <li><strong>3.</strong> Click the 🖼️ <strong>Generate</strong> for image generation and image editing.</li>
 <li><strong>5.</strong> (Optional) Enable Diffusion Decoder for image super resolution decoding.
 <li><strong>4.</strong> Adjust generation parameters if needed.
-<br/><strong>💡 Tip 1:</strong> For better image generation quality, we recommend setting <code>top_k = 2048</code>.
-<br/><strong>💡 Tip 2:</strong> For diffusion decoder, CFG scale of 1.5 or 2.0 is enough.
+<br/><strong>💡 Tip 1:</strong> For better image generation quality, we recommend setting <code>temperature = 1.0</code>, <code>top_k = 2048</code>, <code>top_p = 1.0</code>, <code>llm_cfg = 2.0</code>.
+<br/><strong>💡 Tip 2:</strong> For better image editing quality, we recommend setting <code>temperature = 0.7</code>, <code>top_k = 512</code>, <code>top_p = 0.8</code>, <code>llm_cfg = 1.5</code>.
+<br/><strong>💡 Tip 3:</strong> For diffusion decoder, CFG scale of 1.5 or 2.0 is enough.
 </li>
 </ul>
 </div>
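The updated tips amount to two recommended sampling presets plus a diffusion-decoder CFG range. A small sketch of keeping them as plain dictionaries (a hypothetical helper, not part of app.py; the key names simply mirror the UI controls named in the tips):

# Recommended presets from the tip text above (hypothetical helper).
GENERATION_PRESET = {"temperature": 1.0, "top_k": 2048, "top_p": 1.0, "llm_cfg": 2.0}
EDITING_PRESET = {"temperature": 0.7, "top_k": 512, "top_p": 0.8, "llm_cfg": 1.5}
DIFFUSION_DECODER_CFG = 1.5  # per Tip 3, 1.5 or 2.0 is enough

def recommended_preset(task: str) -> dict:
    # Image editing uses the more conservative sampling settings.
    return EDITING_PRESET if task == "editing" else GENERATION_PRESET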
@@ -897,15 +899,15 @@ def build_demo(embed_mode):
 if __name__ == "__main__":
     parser = argparse.ArgumentParser()
     # --- Add arguments for ILLUME configs and checkpoints ---
-    parser.add_argument("--model_name", type=str, default="illume-unified-mllm/illume_plus-qwen-2_5-3b-hf",
+    parser.add_argument("--model_name", type=str, default="ILLUME-MLLM/illume_plus-qwen-2_5-3b-hf",
                         help="Name for builder.")
-    parser.add_argument("--torch_dtype", type=str, default='fp32', choices=['fp32', 'bf16', 'fp16'],
+    parser.add_argument("--torch_dtype", type=str, default='bf16', choices=['fp32', 'bf16', 'fp16'],
                         help="Computation data type.")
 
-    parser.add_argument("--diffusion_decoder_path", type=str, default='illume-unified-mllm/dualvitok_sdxl_decoder.pt',
-                        help="Path to Diffusion Decoder checkpoint (.pt). Required if using diffusion.")
+    parser.add_argument("--diffusion_decoder_path", type=str, default='ILLUME-MLLM/dualvitok_sdxl_decoder',
+                        help="Path to Diffusion Decoder checkpoint. Required if using diffusion.")
 
-    parser.add_argument("--tokenizer_path", type=str, default='illume-unified-mllm/dualvitok',
+    parser.add_argument("--tokenizer_path", type=str, default='ILLUME-MLLM/dualvitok',
                         help="Path to Tokenizer config file (e.g., tokenizer_config.py).")
 
     # --- End ILLUME arguments ---
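The argparse defaults now select bf16 computation and point the model, tokenizer, and diffusion decoder at ILLUME-MLLM repo IDs instead of local paths. A sketch of how the --torch_dtype string is typically resolved to a torch dtype (an assumed helper; the actual resolution code is outside the lines shown in this diff):

import torch

# Map the --torch_dtype choices to torch dtypes (assumption: app.py performs
# an equivalent lookup somewhere outside this diff).
DTYPE_MAP = {"fp32": torch.float32, "bf16": torch.bfloat16, "fp16": torch.float16}

def resolve_dtype(name: str) -> torch.dtype:
    return DTYPE_MAP[name]

With these defaults, launching python app.py with no flags would use ILLUME-MLLM/illume_plus-qwen-2_5-3b-hf in bf16 together with the ILLUME-MLLM/dualvitok tokenizer and ILLUME-MLLM/dualvitok_sdxl_decoder diffusion decoder.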