Spaces:

ResembleAI
/

Chatterbox_TTS_Demo

Runtime error

App Files Community

ollieollie committed on May 13

Commit

b6843d1

1 Parent(s): 78c3bd0

rename to chatterbox

Browse files

This view is limited to 50 files because the commit contains too many changes. See the raw diff for the complete change set.

Files changed (50) hide show

chatterbox/src/chatterbox/__init__.py +1 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/__init__.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/const.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/decoder.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/f0_predictor.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/flow.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/flow_matching.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/hifigan.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/matcha/decoder.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/matcha/flow_matching.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/matcha/text_encoder.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/matcha/transformer.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/s3gen.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/__init__.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/activation.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/attention.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/convolution.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/embedding.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/encoder_layer.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/positionwise_feed_forward.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/subsampling.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/upsample_encoder.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/utils/class_utils.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/utils/mask.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/utils/mel.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/xvector.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3tokenizer/__init__.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/s3tokenizer/s3tokenizer.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/t3/__init__.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/t3/inference/alignment_stream_analyzer.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/t3/inference/t3_hf_backend.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/t3/llama_configs.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/t3/modules/cond_enc.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/t3/modules/learned_pos_emb.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/t3/modules/perceiver.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/t3/modules/t3_config.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/t3/t3.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/tokenizers/__init__.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/tokenizers/tokenizer.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/voice_encoder/__init__.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/voice_encoder/config.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/voice_encoder/melspec.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/models/voice_encoder/voice_encoder.py +0 -0
{orator/src/orator → chatterbox/src/chatterbox}/tts.py +4 -4
{orator/src/orator → chatterbox/src/chatterbox}/vc.py +4 -4
orator/src/orator.egg-info/PKG-INFO +0 -17
orator/src/orator.egg-info/SOURCES.txt +0 -52
orator/src/orator.egg-info/dependency_links.txt +0 -1
orator/src/orator.egg-info/requires.txt +0 -10
orator/src/orator.egg-info/top_level.txt +0 -1

chatterbox/src/chatterbox/__init__.py ADDED Viewed

	@@ -0,0 +1 @@


1	+ from .tts import ChatterboxTTS

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/__init__.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/const.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/decoder.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/f0_predictor.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/flow.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/flow_matching.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/hifigan.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/matcha/decoder.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/matcha/flow_matching.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/matcha/text_encoder.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/matcha/transformer.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/s3gen.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/__init__.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/activation.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/attention.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/convolution.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/embedding.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/encoder_layer.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/positionwise_feed_forward.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/subsampling.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/transformer/upsample_encoder.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/utils/class_utils.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/utils/mask.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/utils/mel.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3gen/xvector.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3tokenizer/__init__.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/s3tokenizer/s3tokenizer.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/t3/__init__.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/t3/inference/alignment_stream_analyzer.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/t3/inference/t3_hf_backend.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/t3/llama_configs.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/t3/modules/cond_enc.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/t3/modules/learned_pos_emb.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/t3/modules/perceiver.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/t3/modules/t3_config.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/t3/t3.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/tokenizers/__init__.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/tokenizers/tokenizer.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/voice_encoder/__init__.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/voice_encoder/config.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/voice_encoder/melspec.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/models/voice_encoder/voice_encoder.py RENAMED Viewed

File without changes

{orator/src/orator → chatterbox/src/chatterbox}/tts.py RENAMED Viewed

@@ -14,7 +14,7 @@ from .models.voice_encoder import VoiceEncoder
 from .models.t3.modules.cond_enc import T3Cond
-REPO_ID = "ResembleAI/Orator"
 def change_pace(speech_tokens: torch.Tensor, pace: float):
@@ -68,7 +68,7 @@ class Conditionals:
         return cls(T3Cond(**kwargs['t3']), kwargs['gen'])
-class OratorTTS:
     ENC_COND_LEN = 6 * S3_SR
     DEC_COND_LEN = 10 * S3GEN_SR
@@ -90,7 +90,7 @@ class OratorTTS:
         self.conds = conds
     @classmethod
-    def from_local(cls, ckpt_dir, device) -> 'OratorTTS':
         ckpt_dir = Path(ckpt_dir)
         ve = VoiceEncoder()
@@ -122,7 +122,7 @@ class OratorTTS:
         return cls(t3, s3gen, ve, tokenizer, device, conds=conds)
     @classmethod
-    def from_pretrained(cls, device) -> 'OratorTTS':
         for fpath in ["ve.pt", "t3.pt", "s3gen.pt", "tokenizer.json", "conds.pt"]:
             local_path = hf_hub_download(repo_id=REPO_ID, filename=fpath)

 from .models.t3.modules.cond_enc import T3Cond
+REPO_ID = "ResembleAI/chatterbox"
 def change_pace(speech_tokens: torch.Tensor, pace: float):
         return cls(T3Cond(**kwargs['t3']), kwargs['gen'])
+class ChatterboxTTS:
     ENC_COND_LEN = 6 * S3_SR
     DEC_COND_LEN = 10 * S3GEN_SR
         self.conds = conds
     @classmethod
+    def from_local(cls, ckpt_dir, device) -> 'ChatterboxTTS':
         ckpt_dir = Path(ckpt_dir)
         ve = VoiceEncoder()
         return cls(t3, s3gen, ve, tokenizer, device, conds=conds)
     @classmethod
+    def from_pretrained(cls, device) -> 'ChatterboxTTS':
         for fpath in ["ve.pt", "t3.pt", "s3gen.pt", "tokenizer.json", "conds.pt"]:
             local_path = hf_hub_download(repo_id=REPO_ID, filename=fpath)

{orator/src/orator → chatterbox/src/chatterbox}/vc.py RENAMED Viewed

@@ -8,10 +8,10 @@ from .models.s3tokenizer import S3_SR
 from .models.s3gen import S3GEN_SR, S3Gen
-REPO_ID = "ResembleAI/Orator"
-class OratorVC:
     ENC_COND_LEN = 6 * S3_SR
     DEC_COND_LEN = 10 * S3GEN_SR
@@ -33,7 +33,7 @@ class OratorVC:
             }
     @classmethod
-    def from_local(cls, ckpt_dir, device) -> 'OratorVC':
         ckpt_dir = Path(ckpt_dir)
         ref_dict = None
         if (builtin_voice := ckpt_dir / "conds.pt").exists():
@@ -49,7 +49,7 @@ class OratorVC:
         return cls(s3gen, device, ref_dict=ref_dict)
     @classmethod
-    def from_pretrained(cls, device) -> 'OratorVC':
         for fpath in ["s3gen.pt", "conds.pt"]:
             local_path = hf_hub_download(repo_id=REPO_ID, filename=fpath)

 from .models.s3gen import S3GEN_SR, S3Gen
+REPO_ID = "ResembleAI/chatterbox"
+class ChatterboxVC:
     ENC_COND_LEN = 6 * S3_SR
     DEC_COND_LEN = 10 * S3GEN_SR
             }
     @classmethod
+    def from_local(cls, ckpt_dir, device) -> 'ChatterboxVC':
         ckpt_dir = Path(ckpt_dir)
         ref_dict = None
         if (builtin_voice := ckpt_dir / "conds.pt").exists():
         return cls(s3gen, device, ref_dict=ref_dict)
     @classmethod
+    def from_pretrained(cls, device) -> 'ChatterboxVC':
         for fpath in ["s3gen.pt", "conds.pt"]:
             local_path = hf_hub_download(repo_id=REPO_ID, filename=fpath)

orator/src/orator.egg-info/PKG-INFO DELETED Viewed

@@ -1,17 +0,0 @@
-Metadata-Version: 2.4
-Name: orator
-Version: 0.1
-Description-Content-Type: text/markdown
-Requires-Dist: numpy==1.26.0
-Requires-Dist: resampy==0.4.3
-Requires-Dist: librosa==0.10.0
-Requires-Dist: s3tokenizer
-Requires-Dist: torch==2.6.0
-Requires-Dist: torchaudio==2.6.0
-Requires-Dist: transformers==4.46.3
-Requires-Dist: diffusers==0.29.0
-Requires-Dist: omegaconf==2.3.0
-Requires-Dist: conformer==0.3.2
-# orator
-Open source TTS model

orator/src/orator.egg-info/SOURCES.txt DELETED Viewed

@@ -1,52 +0,0 @@
-README.md
-pyproject.toml
-src/orator/__init__.py
-src/orator/model_checkpoints.py
-src/orator/tts.py
-src/orator.egg-info/PKG-INFO
-src/orator.egg-info/SOURCES.txt
-src/orator.egg-info/dependency_links.txt
-src/orator.egg-info/requires.txt
-src/orator.egg-info/top_level.txt
-src/orator/models/s3gen/__init__.py
-src/orator/models/s3gen/const.py
-src/orator/models/s3gen/decoder.py
-src/orator/models/s3gen/f0_predictor.py
-src/orator/models/s3gen/flow.py
-src/orator/models/s3gen/flow_matching.py
-src/orator/models/s3gen/hifigan.py
-src/orator/models/s3gen/s3gen.py
-src/orator/models/s3gen/xvector.py
-src/orator/models/s3gen/matcha/decoder.py
-src/orator/models/s3gen/matcha/flow_matching.py
-src/orator/models/s3gen/matcha/text_encoder.py
-src/orator/models/s3gen/matcha/transformer.py
-src/orator/models/s3gen/transformer/__init__.py
-src/orator/models/s3gen/transformer/activation.py
-src/orator/models/s3gen/transformer/attention.py
-src/orator/models/s3gen/transformer/convolution.py
-src/orator/models/s3gen/transformer/embedding.py
-src/orator/models/s3gen/transformer/encoder_layer.py
-src/orator/models/s3gen/transformer/positionwise_feed_forward.py
-src/orator/models/s3gen/transformer/subsampling.py
-src/orator/models/s3gen/transformer/upsample_encoder.py
-src/orator/models/s3gen/utils/class_utils.py
-src/orator/models/s3gen/utils/mask.py
-src/orator/models/s3gen/utils/mel.py
-src/orator/models/s3tokenizer/__init__.py
-src/orator/models/s3tokenizer/s3tokenizer.py
-src/orator/models/t3/__init__.py
-src/orator/models/t3/llama_configs.py
-src/orator/models/t3/t3.py
-src/orator/models/t3/inference/t3_hf_backend.py
-src/orator/models/t3/modules/cond_enc.py
-src/orator/models/t3/modules/learned_pos_emb.py
-src/orator/models/t3/modules/perceiver.py
-src/orator/models/t3/modules/t3_config.py
-src/orator/models/tokenizers/__init__.py
-src/orator/models/tokenizers/tokenizer.py
-src/orator/models/voice_encoder/__init__.py
-src/orator/models/voice_encoder/voice_encoder.py
-src/orator/transforms/spectrogram.py
-src/orator/transforms/syn_transforms.py
-src/orator/transforms/webrtc.py

orator/src/orator.egg-info/dependency_links.txt DELETED Viewed

	@@ -1 +0,0 @@
1	-

orator/src/orator.egg-info/requires.txt DELETED Viewed

@@ -1,10 +0,0 @@
-numpy==1.26.0
-resampy==0.4.3
-librosa==0.10.0
-s3tokenizer
-torch==2.6.0
-torchaudio==2.6.0
-transformers==4.46.3
-diffusers==0.29.0
-omegaconf==2.3.0
-conformer==0.3.2

orator/src/orator.egg-info/top_level.txt DELETED Viewed

	@@ -1 +0,0 @@
1	- orator