Spaces:

ResembleAI
/

Chatterbox_TTS_Demo

Runtime error

App Files Files Community

ollieollie committed 14 days ago

Commit

5aefb03

1 Parent(s): efe64f8

add text norm + watermark

Browse files

Files changed (46) hide show

chatterbox/src/chatterbox/__init__.py +2 -1
chatterbox/src/chatterbox/__pycache__/__init__.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/__pycache__/tts.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/__pycache__/vc.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/__pycache__/__init__.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/__pycache__/const.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/__pycache__/decoder.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/__pycache__/f0_predictor.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/__pycache__/flow.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/__pycache__/flow_matching.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/__pycache__/hifigan.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/__pycache__/s3gen.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/__pycache__/xvector.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/matcha/__pycache__/decoder.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/matcha/__pycache__/flow_matching.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/matcha/__pycache__/transformer.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/__init__.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/activation.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/attention.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/convolution.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/embedding.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/encoder_layer.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/positionwise_feed_forward.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/subsampling.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/upsample_encoder.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/utils/__pycache__/class_utils.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/utils/__pycache__/mask.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3gen/utils/__pycache__/mel.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3tokenizer/__pycache__/__init__.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/s3tokenizer/__pycache__/s3tokenizer.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/t3/__pycache__/__init__.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/t3/__pycache__/llama_configs.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/t3/__pycache__/t3.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/t3/inference/__pycache__/alignment_stream_analyzer.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/t3/inference/__pycache__/t3_hf_backend.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/t3/modules/__pycache__/cond_enc.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/t3/modules/__pycache__/learned_pos_emb.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/t3/modules/__pycache__/perceiver.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/t3/modules/__pycache__/t3_config.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/tokenizers/__pycache__/__init__.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/tokenizers/__pycache__/tokenizer.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/voice_encoder/__pycache__/__init__.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/voice_encoder/__pycache__/config.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/voice_encoder/__pycache__/melspec.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/models/voice_encoder/__pycache__/voice_encoder.cpython-311.pyc +0 -0
chatterbox/src/chatterbox/tts.py +44 -0

chatterbox/src/chatterbox/__init__.py CHANGED Viewed

	@@ -1 +1,2 @@
1	- from .tts import ChatterboxTTS


1	+ from .tts import ChatterboxTTS
2	+ from .vc import ChatterboxVC

chatterbox/src/chatterbox/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (275 Bytes). View file

chatterbox/src/chatterbox/__pycache__/tts.cpython-311.pyc ADDED Viewed

Binary file (12.5 kB). View file

chatterbox/src/chatterbox/__pycache__/vc.cpython-311.pyc ADDED Viewed

Binary file (4.9 kB). View file

chatterbox/src/chatterbox/models/s3gen/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (294 Bytes). View file

chatterbox/src/chatterbox/models/s3gen/__pycache__/const.cpython-311.pyc ADDED Viewed

Binary file (190 Bytes). View file

chatterbox/src/chatterbox/models/s3gen/__pycache__/decoder.cpython-311.pyc ADDED Viewed

Binary file (16.9 kB). View file

chatterbox/src/chatterbox/models/s3gen/__pycache__/f0_predictor.cpython-311.pyc ADDED Viewed

Binary file (2.7 kB). View file

chatterbox/src/chatterbox/models/s3gen/__pycache__/flow.cpython-311.pyc ADDED Viewed

Binary file (13.7 kB). View file

chatterbox/src/chatterbox/models/s3gen/__pycache__/flow_matching.cpython-311.pyc ADDED Viewed

Binary file (13.3 kB). View file

chatterbox/src/chatterbox/models/s3gen/__pycache__/hifigan.cpython-311.pyc ADDED Viewed

Binary file (26.3 kB). View file

chatterbox/src/chatterbox/models/s3gen/__pycache__/s3gen.cpython-311.pyc ADDED Viewed

Binary file (13.7 kB). View file

chatterbox/src/chatterbox/models/s3gen/__pycache__/xvector.cpython-311.pyc ADDED Viewed

Binary file (24 kB). View file

chatterbox/src/chatterbox/models/s3gen/matcha/__pycache__/decoder.cpython-311.pyc ADDED Viewed

Binary file (21.3 kB). View file

chatterbox/src/chatterbox/models/s3gen/matcha/__pycache__/flow_matching.cpython-311.pyc ADDED Viewed

Binary file (6.46 kB). View file

chatterbox/src/chatterbox/models/s3gen/matcha/__pycache__/transformer.cpython-311.pyc ADDED Viewed

Binary file (14.7 kB). View file

chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (190 Bytes). View file

chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/activation.cpython-311.pyc ADDED Viewed

Binary file (3.58 kB). View file

chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/attention.cpython-311.pyc ADDED Viewed

Binary file (15.7 kB). View file

chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/convolution.cpython-311.pyc ADDED Viewed

Binary file (5.54 kB). View file

chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/embedding.cpython-311.pyc ADDED Viewed

Binary file (17.3 kB). View file

chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/encoder_layer.cpython-311.pyc ADDED Viewed

Binary file (11.2 kB). View file

chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/positionwise_feed_forward.cpython-311.pyc ADDED Viewed

Binary file (6.24 kB). View file

chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/subsampling.cpython-311.pyc ADDED Viewed

Binary file (18.9 kB). View file

chatterbox/src/chatterbox/models/s3gen/transformer/__pycache__/upsample_encoder.cpython-311.pyc ADDED Viewed

Binary file (15.6 kB). View file

chatterbox/src/chatterbox/models/s3gen/utils/__pycache__/class_utils.cpython-311.pyc ADDED Viewed

Binary file (1.93 kB). View file

chatterbox/src/chatterbox/models/s3gen/utils/__pycache__/mask.cpython-311.pyc ADDED Viewed

Binary file (6.25 kB). View file

chatterbox/src/chatterbox/models/s3gen/utils/__pycache__/mel.cpython-311.pyc ADDED Viewed

Binary file (4.05 kB). View file

chatterbox/src/chatterbox/models/s3tokenizer/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (806 Bytes). View file

chatterbox/src/chatterbox/models/s3tokenizer/__pycache__/s3tokenizer.cpython-311.pyc ADDED Viewed

Binary file (7.94 kB). View file

chatterbox/src/chatterbox/models/t3/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (218 Bytes). View file

chatterbox/src/chatterbox/models/t3/__pycache__/llama_configs.cpython-311.pyc ADDED Viewed

Binary file (1.34 kB). View file

chatterbox/src/chatterbox/models/t3/__pycache__/t3.cpython-311.pyc ADDED Viewed

Binary file (13.4 kB). View file

chatterbox/src/chatterbox/models/t3/inference/__pycache__/alignment_stream_analyzer.cpython-311.pyc ADDED Viewed

Binary file (7.08 kB). View file

chatterbox/src/chatterbox/models/t3/inference/__pycache__/t3_hf_backend.cpython-311.pyc ADDED Viewed

Binary file (4.82 kB). View file

chatterbox/src/chatterbox/models/t3/modules/__pycache__/cond_enc.cpython-311.pyc ADDED Viewed

Binary file (5.37 kB). View file

chatterbox/src/chatterbox/models/t3/modules/__pycache__/learned_pos_emb.cpython-311.pyc ADDED Viewed

Binary file (2.54 kB). View file

chatterbox/src/chatterbox/models/t3/modules/__pycache__/perceiver.cpython-311.pyc ADDED Viewed

Binary file (12.6 kB). View file

chatterbox/src/chatterbox/models/t3/modules/__pycache__/t3_config.cpython-311.pyc ADDED Viewed

Binary file (1.27 kB). View file

chatterbox/src/chatterbox/models/tokenizers/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (242 Bytes). View file

chatterbox/src/chatterbox/models/tokenizers/__pycache__/tokenizer.cpython-311.pyc ADDED Viewed

Binary file (3.1 kB). View file

chatterbox/src/chatterbox/models/voice_encoder/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (281 Bytes). View file

chatterbox/src/chatterbox/models/voice_encoder/__pycache__/config.cpython-311.pyc ADDED Viewed

Binary file (859 Bytes). View file

chatterbox/src/chatterbox/models/voice_encoder/__pycache__/melspec.cpython-311.pyc ADDED Viewed

Binary file (3.59 kB). View file

chatterbox/src/chatterbox/models/voice_encoder/__pycache__/voice_encoder.cpython-311.pyc ADDED Viewed

Binary file (18.7 kB). View file

chatterbox/src/chatterbox/tts.py CHANGED Viewed

@@ -28,6 +28,48 @@ def change_pace(speech_tokens: torch.Tensor, pace: float):
     return speech_tokens
 @dataclass
 class Conditionals:
     """
@@ -176,6 +218,8 @@ class ChatterboxTTS:
                 emotion_adv=exaggeration * torch.ones(1, 1, 1),
             ).to(device=self.device)
         text_tokens = self.tokenizer.text_to_tokens(text).to(self.device)
         sot = self.t3.hp.start_text_token

     return speech_tokens
# Ordered (old, new) substitutions; order matters because later entries
# clean up sequences that earlier ones can produce (e.g. " ," after ";").
_PUNC_REPLACEMENTS = (
    ("...", ", "),
    ("…", ", "),
    (":", ","),
    (" - ", ", "),
    (";", ", "),
    ("—", "-"),
    ("–", "-"),
    (" ,", ","),
    ("“", "\""),
    ("”", "\""),
    ("‘", "'"),
    ("’", "'"),
)

# Trailing characters that already count as an acceptable ending.
_SENTENCE_ENDERS = (".", "!", "?", "-", ",")


def punc_norm(text: str) -> str:
    """Normalise punctuation and spacing of *text* before tokenization.

    Quick cleanup for punctuation produced by LLMs or containing
    characters not seen often in the dataset.

    Steps, in order:
      1. Collapse every run of whitespace to a single space and trim.
      2. Return a fixed fallback sentence if nothing is left.
      3. Capitalise the first letter.
      4. Apply the substitutions in ``_PUNC_REPLACEMENTS``.
      5. Collapse whitespace again, because substitutions that expand to
         ", " can leave a double space or a trailing space behind.
      6. Append a full stop unless the text already ends with one of
         ``_SENTENCE_ENDERS``.

    Args:
        text: Raw input text.

    Returns:
        The normalised text, or the fallback sentence when *text* is
        empty or contains only whitespace.
    """
    # Collapse first so that leading whitespace cannot hide the first
    # letter from the capitalisation step, and so that whitespace-only
    # input is treated the same as empty input.
    text = " ".join(text.split())
    if not text:
        return "You need to add some text for me to talk."

    # Capitalise first letter
    if text[0].islower():
        text = text[0].upper() + text[1:]

    # Replace uncommon/llm punc
    for old_char_sequence, new_char in _PUNC_REPLACEMENTS:
        text = text.replace(old_char_sequence, new_char)

    # Substitutions such as ";" -> ", " may have reintroduced repeated or
    # trailing spaces; normalise once more.
    text = " ".join(text.split())

    # Add full stop if no ending punc
    if not text.endswith(_SENTENCE_ENDERS):
        text += "."
    return text
 @dataclass
 class Conditionals:
     """
                 emotion_adv=exaggeration * torch.ones(1, 1, 1),
             ).to(device=self.device)
+        # Norm and tokenize text
+        text = punc_norm(text)
         text_tokens = self.tokenizer.text_to_tokens(text).to(self.device)
         sot = self.t3.hp.start_text_token