Spaces:
Running
Running
from flask import jsonify, send_file, request | |
from main import * | |
import torch, torchaudio, uuid, io, base64 | |
def text_to_speech_func(text, output_path="output_audio.wav"): | |
if tts_model is None: return {"error": "TTS model not initialized."} | |
input_tokens = tts_model.tokenizer(text, return_tensors="pt", padding=True).to(device) | |
with torch.no_grad(): audio_output = tts_model(input_tokens['input_ids']) | |
torchaudio.save(output_path, audio_output.cpu(), 16000); return output_path | |
def tts_api(text): | |
output_file = text_to_speech_func(text) | |
if isinstance(output_file, dict) and "error" in output_file: return {"error": output_file["error"]} | |
with open(output_file, 'rb') as f: audio_content = f.read() | |
audio_base64 = base64.b64encode(audio_content).decode('utf-8'); os.remove(output_file); return {"audio_base64": audio_base64, "mimetype": "audio/wav"} | |