Spaces:

tanbw
/

CosyVoice

Running on Zero

CosyVoice committed on Sep 5

Commit

e141634

•

1 Parent(s): 11eacb8

remove unnecessary code

Files changed (2) hide show

cosyvoice/flow/flow.py CHANGED Viewed

@@ -113,7 +113,7 @@ class MaskedDiffWithXvec(torch.nn.Module):
         # concat text and prompt_text
         token_len1, token_len2 = prompt_token.shape[1], token.shape[1]
         token, token_len = torch.concat([prompt_token, token], dim=1), prompt_token_len + token_len
-        mask = (~make_pad_mask(token_len)).to(embedding.dtype).unsqueeze(-1).to(embedding)
         token = self.input_embedding(torch.clamp(token, min=0)) * mask
         # text encode

         # concat text and prompt_text
         token_len1, token_len2 = prompt_token.shape[1], token.shape[1]
         token, token_len = torch.concat([prompt_token, token], dim=1), prompt_token_len + token_len
+        mask = (~make_pad_mask(token_len)).unsqueeze(-1).to(embedding)
         token = self.input_embedding(torch.clamp(token, min=0)) * mask
         # text encode

cosyvoice/flow/flow_matching.py CHANGED Viewed

@@ -14,8 +14,6 @@
 import torch
 import torch.nn.functional as F
 from matcha.models.components.flow_matching import BASECFM
-import onnxruntime as ort
-import numpy as np
 class ConditionalCFM(BASECFM):
     def __init__(self, in_channels, cfm_params, n_spks=1, spk_emb_dim=64, estimator: torch.nn.Module = None):

 import torch
 import torch.nn.functional as F
 from matcha.models.components.flow_matching import BASECFM
 class ConditionalCFM(BASECFM):
     def __init__(self, in_channels, cfm_params, n_spks=1, spk_emb_dim=64, estimator: torch.nn.Module = None):