ByteMorpher-Demo

Running on Zero

App Files Community

bol committed on May 23

Commit

47dbef4

1 Parent(s): de42ae8

edit

Browse files

Files changed (5) hide show

.DS_Store +0 -0
app.py +45 -44
assets/0_camera_zoom/20486354.json +0 -3
assets/0_camera_zoom/20486354.png +0 -3
assets/0_camera_zoom/20486354_2.png +0 -3

.DS_Store CHANGED Viewed

Binary files a/.DS_Store and b/.DS_Store differ

app.py CHANGED Viewed

@@ -4,18 +4,17 @@ import spaces
 import os
 import numpy as np
 from PIL import Image
 from huggingface_hub import hf_hub_download
 from safetensors.torch import load_file
 from omegaconf import OmegaConf
 from src.flux.util import load_ae, load_clip, load_flow_model2, load_t5, tensor_to_pil_image
 from src.flux.xflux_pipeline import XFluxSampler
-from image_datasets.dataset import image_resize
-# ===== No CUDA/model initialization globally =====
 args = OmegaConf.load("inference_configs/inference.yaml")
 is_schnell = args.model_name == "flux-schnell"
 # sampler = None
 device = torch.device("cuda")
 dtype = torch.bfloat16
@@ -23,36 +22,39 @@ dit = load_flow_model2(args.model_name, device="cpu").to(device, dtype=dtype)
 vae = load_ae(args.model_name, device="cpu").to(device, dtype=dtype)
 t5 = load_t5(device="cpu", max_length=256 if is_schnell else 512).to(device, dtype=dtype)
 clip = load_clip("cpu").to(device, dtype=dtype)
-vae.requires_grad_(False)
-t5.requires_grad_(False)
-clip.requires_grad_(False)
-model_path = hf_hub_download(
-    repo_id="Boese0601/ByteMorpher",
-    filename="dit.safetensors",
-    use_auth_token=os.getenv("HF_TOKEN")
-)
-state_dict = load_file(model_path)
-dit.load_state_dict(state_dict)
-dit.eval()
-dit.to(device, dtype=dtype)
-sampler = XFluxSampler(
-    clip=clip,
-    t5=t5,
-    ae=vae,
-    model=dit,
-    device=device,
-    ip_loaded=False,
-    spatial_condition=False,
-    clip_image_processor=None,
-    image_encoder=None,
-    improj=None
-)
 #test push
 @spaces.GPU
 def generate(image: Image.Image, edit_prompt: str):
     # global sampler
     # device = torch.device("cuda")
     # dtype = torch.bfloat16
@@ -95,18 +97,17 @@ def generate(image: Image.Image, edit_prompt: str):
     img = torch.from_numpy((np.array(img) / 127.5) - 1)
     img = img.permute(2, 0, 1).unsqueeze(0).to(device, dtype=dtype)
-    with torch.no_grad():
-        result = sampler(
-            prompt=edit_prompt,
-            width=args.sample_width,
-            height=args.sample_height,
-            num_steps=args.sample_steps,
-            image_prompt=None,
-            true_gs=args.cfg_scale,
-            seed=args.seed,
-            ip_scale=args.ip_scale if args.use_ip else 1.0,
-            source_image=img if args.use_spatial_condition else None,
-        )
     return tensor_to_pil_image(result)
 def get_samples():

 import os
 import numpy as np
 from PIL import Image
 from huggingface_hub import hf_hub_download
 from safetensors.torch import load_file
 from omegaconf import OmegaConf
+from image_datasets.dataset import image_resize
 from src.flux.util import load_ae, load_clip, load_flow_model2, load_t5, tensor_to_pil_image
 from src.flux.xflux_pipeline import XFluxSampler
 args = OmegaConf.load("inference_configs/inference.yaml")
 is_schnell = args.model_name == "flux-schnell"
+'/home/user/app/assets/0_camera_zoom/20486354.png'
+'/home/user/app/assets/0_camera_zoom/20486354.png'
 # sampler = None
 device = torch.device("cuda")
 dtype = torch.bfloat16
 vae = load_ae(args.model_name, device="cpu").to(device, dtype=dtype)
 t5 = load_t5(device="cpu", max_length=256 if is_schnell else 512).to(device, dtype=dtype)
 clip = load_clip("cpu").to(device, dtype=dtype)
 #test push
 @spaces.GPU
 def generate(image: Image.Image, edit_prompt: str):
+    vae.requires_grad_(False)
+    t5.requires_grad_(False)
+    clip.requires_grad_(False)
+    model_path = hf_hub_download(
+        repo_id="Boese0601/ByteMorpher",
+        filename="dit.safetensors",
+        use_auth_token=os.getenv("HF_TOKEN")
+    )
+    state_dict = load_file(model_path)
+    dit.load_state_dict(state_dict)
+    dit.eval()
+    dit.to(device, dtype=dtype)
+    sampler = XFluxSampler(
+        clip=clip,
+        t5=t5,
+        ae=vae,
+        model=dit,
+        device=device,
+        ip_loaded=False,
+        spatial_condition=False,
+        clip_image_processor=None,
+        image_encoder=None,
+        improj=None
+    )
     # global sampler
     # device = torch.device("cuda")
     # dtype = torch.bfloat16
     img = torch.from_numpy((np.array(img) / 127.5) - 1)
     img = img.permute(2, 0, 1).unsqueeze(0).to(device, dtype=dtype)
+    result = sampler(
+        prompt=edit_prompt,
+        width=args.sample_width,
+        height=args.sample_height,
+        num_steps=args.sample_steps,
+        image_prompt=None,
+        true_gs=args.cfg_scale,
+        seed=args.seed,
+        ip_scale=args.ip_scale if args.use_ip else 1.0,
+        source_image=img if args.use_spatial_condition else None,
+    )
     return tensor_to_pil_image(result)
 def get_samples():

assets/0_camera_zoom/20486354.json DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:7917201faf043e935ea4ddd94c7e570fe5ca51f8bed66ee4d4dabe480f8390b5
-size 1128

assets/0_camera_zoom/20486354.png DELETED Viewed

Git LFS Details

SHA256: b124690b006104dbde0b59fb88189cf27fb5ccb07d31bd86bb376f12e6c845b0
Pointer size: 128 Bytes
Size of remote file: 131 Bytes

assets/0_camera_zoom/20486354_2.png DELETED Viewed

Git LFS Details

SHA256: 122440474104f5e2cf739f5a4a8294d997abe90528737f384dc64d9860a05b9b
Pointer size: 128 Bytes
Size of remote file: 132 Bytes