Spaces:
Configuration error
Configuration error
#!/usr/bin/env python3
"""Smoke test for the CosyVoice-300M-SFT text-to-speech model.

Loads the pretrained model, prints up to five of the speaker names it
reports, synthesizes one fixed Chinese sentence with the '中文女' speaker and
saves every returned segment as ``test_output_<i>.wav`` in the current
working directory.

All paths are relative, so run the script from the directory that contains
``third_party/`` and ``pretrained_models/``.

Exit status: 0 when the test succeeds, 1 when any step fails.
"""
import sys
import traceback

# Make the vendored Matcha-TTS checkout importable before the cosyvoice
# imports run (presumably cosyvoice depends on it -- confirm against the repo).
sys.path.append('third_party/Matcha-TTS')

MODEL_DIR = 'pretrained_models/CosyVoice-300M-SFT'
TEST_TEXT = '你好,我是通义生成式语音大模型'
TEST_SPEAKER = '中文女'
MAX_SPEAKERS_SHOWN = 5


def main() -> int:
    """Run the smoke test and return a process exit status.

    Returns:
        0 if the model loaded and every generated segment was saved,
        1 if any step raised an exception (the error and its traceback
        are printed before returning).
    """
    try:
        # Imported inside the try block on purpose: a missing or broken
        # installation is then reported by the handler below instead of
        # aborting with a bare ImportError.
        from cosyvoice.cli.cosyvoice import CosyVoice
        # Not used below; kept so the test still checks that this module
        # can be imported.
        from cosyvoice.utils.file_utils import load_wav  # noqa: F401
        import torchaudio

        print("Loading CosyVoice model...")
        cosyvoice = CosyVoice(MODEL_DIR, load_jit=False, load_trt=False, fp16=False)

        print("Available speakers:")
        speakers = cosyvoice.list_available_spks()
        for spk in speakers[:MAX_SPEAKERS_SHOWN]:
            print(f" - {spk}")

        print("\nGenerating speech...")
        # Generate a simple test: one output file per yielded segment.
        segments = cosyvoice.inference_sft(TEST_TEXT, TEST_SPEAKER, stream=False)
        for i, segment in enumerate(segments):
            torchaudio.save(f'test_output_{i}.wav', segment['tts_speech'], cosyvoice.sample_rate)
            print(f"Saved test_output_{i}.wav")

        print("Test successful!")
    except Exception as e:
        # Top-level boundary of a test script: report everything, then signal
        # failure through the exit status so shells and CI can detect it.
        print(f"Error: {e}")
        traceback.print_exc()
        return 1
    return 0


if __name__ == "__main__":
    sys.exit(main())