Odysseus v1.0

2026-06-17 10:15:27 -04:00 · 2026-05-31 23:58:26 +09:00
commit e5c99a5eee
421 changed files with 271349 additions and 0 deletions
@@ -0,0 +1,87 @@
+# routes/tts_routes.py
+"""
+TTS API routes — multi-provider (local Kokoro, API endpoint, browser).
+"""
+
+from fastapi import APIRouter, HTTPException
+from fastapi.responses import Response
+from pydantic import BaseModel
+import logging
+
+logger = logging.getLogger(__name__)
+
+class TTSRequest(BaseModel):
+    text: str
+    format: str = "audio"  # "audio" or "base64"
+
+def setup_tts_routes(tts_service):
+    """Setup TTS routes with the provided TTS service"""
+    router = APIRouter(prefix="/api/tts", tags=["tts"])
+
+    @router.get("/stats")
+    async def get_tts_stats():
+        """Get TTS service statistics"""
+        try:
+            return tts_service.get_stats()
+        except Exception as e:
+            logger.error(f"Failed to get TTS stats: {e}")
+            raise HTTPException(status_code=500, detail=str(e))
+
+    @router.post("/synthesize")
+    async def synthesize_speech(request: TTSRequest):
+        """Synthesize speech from text"""
+        try:
+            if not tts_service.available:
+                raise HTTPException(
+                    status_code=503,
+                    detail={"message": "TTS service not available"}
+                )
+            
+            if request.format == "base64":
+                audio_b64 = tts_service.synthesize_to_base64(request.text)
+                if not audio_b64:
+                    raise HTTPException(
+                        status_code=500,
+                        detail={"message": "Synthesis failed"}
+                    )
+                return {"audio": audio_b64}
+            
+            else:  # audio format
+                audio_data = tts_service.synthesize(request.text)
+                if not audio_data:
+                    raise HTTPException(
+                        status_code=500,
+                        detail={"message": "Synthesis failed"}
+                    )
+                
+                # Detect format from magic bytes (MP3: ID3 tag or sync word ff e0+)
+                is_mp3 = audio_data[:3] == b'ID3' or (len(audio_data) >= 2 and audio_data[0] == 0xff and (audio_data[1] & 0xe0) == 0xe0)
+                mime = "audio/mpeg" if is_mp3 else "audio/wav"
+                return Response(
+                    content=audio_data,
+                    media_type=mime,
+                    headers={
+                        "Content-Disposition": "inline; filename=speech.mp3" if "mpeg" in mime else "inline; filename=speech.wav"
+                    }
+                )
+        
+        except HTTPException:
+            raise
+        except Exception as e:
+            logger.error(f"Synthesis error: {e}", exc_info=True)
+            raise HTTPException(
+                status_code=500,
+                detail={"message": f"Synthesis failed: {str(e)}"}
+            )
+
+    @router.post("/clear-cache")
+    async def clear_tts_cache():
+        """Clear TTS cache"""
+        try:
+            tts_service.clear_cache()
+            return {"success": True, "message": "Cache cleared"}
+        except Exception as e:
+            logger.error(f"Failed to clear cache: {e}")
+            raise HTTPException(status_code=500, detail=str(e))
+
+    return router