|
from fastapi import Body, HTTPException |
|
from fastapi.responses import FileResponse, StreamingResponse |
|
from pydantic import BaseModel |
|
|
|
from modules.api.Api import APIManager |
|
from modules.api.impl.handler.SSMLHandler import SSMLHandler |
|
from modules.api.impl.model.audio_model import AdjustConfig, AudioFormat |
|
from modules.api.impl.model.chattts_model import InferConfig |
|
from modules.api.impl.model.enhancer_model import EnhancerConfig |
|
|
|
|
|
class SSMLRequest(BaseModel): |
|
ssml: str |
|
format: AudioFormat = "mp3" |
|
|
|
|
|
batch_size: int = 4 |
|
|
|
|
|
eos: str = "[uv_break]" |
|
|
|
spliter_thr: int = 100 |
|
|
|
enhancer: EnhancerConfig = EnhancerConfig() |
|
adjuster: AdjustConfig = AdjustConfig() |
|
|
|
|
|
async def synthesize_ssml_api( |
|
request: SSMLRequest = Body( |
|
..., description="JSON body with SSML string and format" |
|
) |
|
): |
|
try: |
|
ssml = request.ssml |
|
format = request.format.lower() |
|
batch_size = request.batch_size |
|
eos = request.eos |
|
spliter_thr = request.spliter_thr |
|
enhancer = request.enhancer |
|
adjuster = request.adjuster |
|
|
|
if batch_size < 1: |
|
raise HTTPException( |
|
status_code=400, detail="Batch size must be greater than 0." |
|
) |
|
|
|
if spliter_thr < 50: |
|
raise HTTPException( |
|
status_code=400, detail="Spliter threshold must be greater than 50." |
|
) |
|
|
|
if not ssml or ssml == "": |
|
raise HTTPException(status_code=400, detail="SSML content is required.") |
|
|
|
if format not in ["mp3", "wav"]: |
|
raise HTTPException( |
|
status_code=400, detail="Format must be 'mp3' or 'wav'." |
|
) |
|
|
|
infer_config = InferConfig( |
|
batch_size=batch_size, |
|
spliter_threshold=spliter_thr, |
|
eos=eos, |
|
) |
|
adjust_config = adjuster |
|
enhancer_config = enhancer |
|
|
|
handler = SSMLHandler( |
|
ssml_content=ssml, |
|
infer_config=infer_config, |
|
adjust_config=adjust_config, |
|
enhancer_config=enhancer_config, |
|
) |
|
|
|
buffer = handler.enqueue_to_buffer(format=request.format) |
|
|
|
mime_type = f"audio/{format}" |
|
if format == AudioFormat.mp3: |
|
mime_type = "audio/mpeg" |
|
return StreamingResponse(buffer, media_type=mime_type) |
|
|
|
except Exception as e: |
|
import logging |
|
|
|
logging.exception(e) |
|
|
|
if isinstance(e, HTTPException): |
|
raise e |
|
else: |
|
raise HTTPException(status_code=500, detail=str(e)) |
|
|
|
|
|
def setup(api_manager: APIManager): |
|
api_manager.post("/v1/ssml", response_class=FileResponse)(synthesize_ssml_api) |
|
|