Spaces:

Emmiq
/

EmmiSpace

Build error

SWivid committed on Jan 7

Commit

c34c0bb

1 Parent(s): f0a2045

fix no_ref_audio in cfm.py

Files changed (1) hide show

src/f5_tts/model/cfm.py CHANGED Viewed

@@ -142,6 +142,9 @@ class CFM(nn.Module):
             test_cond = F.pad(cond, (0, 0, cond_seq_len, max_duration - 2 * cond_seq_len), value=0.0)
         cond = F.pad(cond, (0, 0, 0, max_duration - cond_seq_len), value=0.0)
         cond_mask = F.pad(cond_mask, (0, max_duration - cond_mask.shape[-1]), value=False)
         cond_mask = cond_mask.unsqueeze(-1)
         step_cond = torch.where(
@@ -153,10 +156,6 @@ class CFM(nn.Module):
         else:  # save memory and speed up, as single inference need no mask currently
             mask = None
-        # test for no ref audio
-        if no_ref_audio:
-            cond = torch.zeros_like(cond)
         # neural ode
         def fn(t, x):

             test_cond = F.pad(cond, (0, 0, cond_seq_len, max_duration - 2 * cond_seq_len), value=0.0)
         cond = F.pad(cond, (0, 0, 0, max_duration - cond_seq_len), value=0.0)
+        if no_ref_audio:
+            cond = torch.zeros_like(cond)
         cond_mask = F.pad(cond_mask, (0, max_duration - cond_mask.shape[-1]), value=False)
         cond_mask = cond_mask.unsqueeze(-1)
         step_cond = torch.where(
         else:  # save memory and speed up, as single inference need no mask currently
             mask = None
         # neural ode
         def fn(t, x):