Spaces:
Configuration error
Configuration error
#!/usr/bin/env python3
"""Smoke test for English zero-shot synthesis with CosyVoice2-0.5B.

Loads the model from ``MODEL_PATH``, synthesizes one English sentence,
writes the first generated segment to ``OUTPUT_FILE`` and reports how long
loading and generation took.
"""
import os
import sys
import time

# Directory the pretrained CosyVoice2-0.5B checkpoint is expected in.
MODEL_PATH = 'pretrained_models/CosyVoice2-0.5B'
# WAV file the synthesized speech is written to.
OUTPUT_FILE = "cosyvoice2_english_test.wav"


def main():
    """Run the synthesis smoke test.

    Returns:
        int: 0 when the script ran to completion, 1 when the model
        directory is missing or any step raised an exception.
    """
    print("=== CosyVoice2-0.5B English Test ===")

    # Configure the environment: route Hugging Face requests through the
    # mirror. Set before the imports below, as in the original ordering.
    os.environ['HF_ENDPOINT'] = 'https://hf-mirror.com'

    try:
        # Imported lazily so a missing dependency is reported by the
        # handler below instead of aborting before any output.
        # CosyVoice2 is the loader for the CosyVoice2-0.5B checkpoint.
        from cosyvoice.cli.cosyvoice import CosyVoice2
        import torchaudio

        # Check that the model has been downloaded.
        if not os.path.exists(MODEL_PATH):
            print(f"❌ Modelo ainda não baixado em {MODEL_PATH}")
            print("Aguarde o download terminar...")
            return 1

        print("Carregando CosyVoice2-0.5B...")
        start = time.time()
        cosyvoice = CosyVoice2(MODEL_PATH, load_jit=False, load_trt=False, fp16=False)
        print(f"✅ Modelo carregado em {time.time()-start:.1f}s")

        # English test sentence and the transcript of the prompt audio.
        text = "Hello! This is CosyVoice version two point five B. The new model has better streaming performance and improved pronunciation for English text to speech synthesis."
        prompt_text = "Welcome to the demonstration of our advanced speech synthesis system."

        print(f"\nTexto: {text}")
        print("Gerando áudio...")

        start = time.time()
        # NOTE(review): the third argument is the prompt audio. Upstream
        # examples pass a 16 kHz waveform matching prompt_text; None is kept
        # from the original script -- confirm it is accepted, or supply a
        # real prompt recording.
        segments = cosyvoice.inference_zero_shot(text, prompt_text, None, stream=False)
        # Only the first generated segment is saved.
        first_segment = next(iter(segments), None)
        if first_segment is not None:
            torchaudio.save(OUTPUT_FILE, first_segment['tts_speech'], cosyvoice.sample_rate)

        duration = time.time() - start
        print(f"✅ Áudio gerado em {duration:.1f}s")

        if os.path.exists(OUTPUT_FILE):
            size = os.path.getsize(OUTPUT_FILE) / 1024
            print(f"📊 Arquivo: {OUTPUT_FILE} ({size:.1f} KB)")
    except Exception as e:
        # Top-level boundary of a test script: show the full traceback and
        # report failure through the exit status.
        print(f"❌ Erro: {e}")
        import traceback
        traceback.print_exc()
        return 1

    return 0


if __name__ == "__main__":
    sys.exit(main())