Spaces:

tanbw
/

CosyVoice

Configuration error

CosyVoice committed on Aug 1, 2024

Commit

9504c3f

1 Parent(s): 553244b

fix flow matching training for zero shot inference

Files changed (1) hide show

cosyvoice/flow/flow.py CHANGED Viewed

@@ -12,6 +12,7 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 import logging
 from typing import Dict, Optional
 import torch
 import torch.nn as nn
@@ -77,6 +78,11 @@ class MaskedDiffWithXvec(torch.nn.Module):
         # get conditions
         conds = torch.zeros(feat.shape, device=token.device)
         conds = conds.transpose(1, 2)
         mask = (~make_pad_mask(feat_len)).to(h)

 # See the License for the specific language governing permissions and
 # limitations under the License.
 import logging
+import random
 from typing import Dict, Optional
 import torch
 import torch.nn as nn
         # get conditions
         conds = torch.zeros(feat.shape, device=token.device)
+        for i, j in enumerate(feat_len):
+            if random.random() < 0.5:
+                continue
+            index = random.randint(0, int(0.3 * j))
+            conds[i, :index] = feat[i, :index]
         conds = conds.transpose(1, 2)
         mask = (~make_pad_mask(feat_len)).to(h)