Hhhh / tts_api.py
Kfjjdjdjdhdhd's picture
Upload 26 files
7b74407 verified
from flask import jsonify, send_file, request
from main import *
import torch, torchaudio, uuid, io, base64
def text_to_speech_func(text, output_path="output_audio.wav"):
if tts_model is None: return {"error": "TTS model not initialized."}
input_tokens = tts_model.tokenizer(text, return_tensors="pt", padding=True).to(device)
with torch.no_grad(): audio_output = tts_model(input_tokens['input_ids'])
torchaudio.save(output_path, audio_output.cpu(), 16000); return output_path
def tts_api(text):
output_file = text_to_speech_func(text)
if isinstance(output_file, dict) and "error" in output_file: return {"error": output_file["error"]}
with open(output_file, 'rb') as f: audio_content = f.read()
audio_base64 = base64.b64encode(audio_content).decode('utf-8'); os.remove(output_file); return {"audio_base64": audio_base64, "mimetype": "audio/wav"}