Spaces:

channelcorp
/

Ko-TTS-Arena

Running on CPU Upgrade

App Files Files Community

Ko-TTS-Arena Contributors committed 7 days ago

Commit

f54c69b

1 Parent(s): 515ea95

feat: Upgrade Typecast to v3.0 API (ssfm-v30), add Jaesun & Jain voices, deactivate legacy GeumHee

Browse files

Files changed (3) hide show

models.py +20 -3
requirements.txt +0 -1
tts.py +37 -27

models.py CHANGED Viewed

@@ -641,15 +641,32 @@ def insert_initial_models():
             is_active=has_humelo,
             model_url="https://humelo.com/",
         ),
-        # Typecast TTS (한국어 특화) - API 키 있을 때만 활성화
         Model(
-            id="typecast-geumhee",
-            name="Typecast (GeumHee)",
             model_type=ModelType.TTS,
             is_open=False,
             is_active=has_typecast,
             model_url="https://typecast.ai/",
         ),
         # Gemini TTS (Google Cloud - 다국어 지원) - 서비스 계정 JSON 필요
         Model(
             id="gemini-tts-aoede",

             is_active=has_humelo,
             model_url="https://humelo.com/",
         ),
+        # Typecast TTS v3.0 (한국어 특화) - API 키 있을 때만 활성화
         Model(
+            id="typecast-jaesun",
+            name="Typecast v3 (재선)",
+            model_type=ModelType.TTS,
+            is_open=False,
+            is_active=has_typecast,
+            model_url="https://typecast.ai/",
+        ),
+        Model(
+            id="typecast-jain",
+            name="Typecast v3 (자인)",
             model_type=ModelType.TTS,
             is_open=False,
             is_active=has_typecast,
             model_url="https://typecast.ai/",
         ),
+        # Legacy Typecast - 비활성화 (v3.0으로 대체)
+        Model(
+            id="typecast-geumhee",
+            name="Typecast (GeumHee) [Legacy]",
+            model_type=ModelType.TTS,
+            is_open=False,
+            is_active=False,  # 비활성화
+            model_url="https://typecast.ai/",
+        ),
         # Gemini TTS (Google Cloud - 다국어 지원) - 서비스 계정 JSON 필요
         Model(
             id="gemini-tts-aoede",

requirements.txt CHANGED Viewed

@@ -14,5 +14,4 @@ huggingface-hub
 scipy
 numpy
 pydub
-typecast-python
 google-cloud-texttospeech

 scipy
 numpy
 pydub
 google-cloud-texttospeech

tts.py CHANGED Viewed

@@ -219,17 +219,27 @@ model_mapping = {
         "voice": "리아",
         "emotion": "neutral",
     },
-    # Typecast TTS (한국어 특화)
     "typecast-geumhee": {
         "provider": "typecast",
-        "voice_id": "tc_5c789c337ad86500073a02cd",
-        "model": "ssfm-v21",
     },
-    # Legacy Typecast ID kept for backward compatibility (routes to GeumHee)
     "typecast-jaeyi": {
         "provider": "typecast",
-        "voice_id": "tc_5c789c337ad86500073a02cd",
-        "model": "ssfm-v21",
     },
     # Gemini TTS (Google Cloud - 다국어 지원)
     "gemini-tts-aoede": {
@@ -435,31 +445,31 @@ def predict_humelo_tts(text: str, voice: str = "리아", emotion: str = "neutral
         return f.name
-def predict_typecast_tts(text: str, voice_id: str = "tc_612ed01c7eb720fddd3ddedf", model: str = "ssfm-v21") -> str:
-    """Typecast TTS API 호출"""
     api_key = TYPECAST_API_KEY
     if not api_key:
         raise ValueError("TYPECAST_API_KEY 환경 변수가 설정되지 않았습니다.")
-    try:
-        from typecast.client import Typecast
-        from typecast.models import TTSRequest
-        cli = Typecast(api_key=api_key)
-        response = cli.text_to_speech(TTSRequest(
-            text=text,
-            model=model,
-            voice_id=voice_id,
-        ))
-        with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as f:
-            f.write(response.audio_data)
-            return f.name
-    except ImportError:
-        raise ValueError("typecast-python 패키지가 설치되지 않았습니다. pip install typecast-python")
-    except Exception as e:
-        raise ValueError(f"Typecast TTS API 오류: {str(e)}")
 def predict_gemini_tts(text: str, voice: str = "Aoede", model: str = "gemini-2.5-flash-tts") -> str:

         "voice": "리아",
         "emotion": "neutral",
     },
+    # Typecast TTS v3.0 (한국어 특화) - 새 보이스
+    "typecast-jaesun": {
+        "provider": "typecast",
+        "voice_id": "tc_684a7a1446e2a628b5b07230",  # 재선
+        "model": "ssfm-v30",
+    },
+    "typecast-jain": {
+        "provider": "typecast",
+        "voice_id": "tc_6809c111e5e8c73f8a0237b2",  # 자인
+        "model": "ssfm-v30",
+    },
+    # Legacy Typecast IDs - both route to the new Jaesun voice
     "typecast-geumhee": {
         "provider": "typecast",
+        "voice_id": "tc_684a7a1446e2a628b5b07230",
+        "model": "ssfm-v30",
     },
     "typecast-jaeyi": {
         "provider": "typecast",
+        "voice_id": "tc_684a7a1446e2a628b5b07230",
+        "model": "ssfm-v30",
     },
     # Gemini TTS (Google Cloud - 다국어 지원)
     "gemini-tts-aoede": {
         return f.name
+def predict_typecast_tts(text: str, voice_id: str, model: str = "ssfm-v30") -> str:
+    """Typecast TTS API 호출 (v3.0 experiment API)"""
     api_key = TYPECAST_API_KEY
     if not api_key:
         raise ValueError("TYPECAST_API_KEY 환경 변수가 설정되지 않았습니다.")
+    url = "https://api.typecast.ai/experiment/text-to-speech"
+    payload = {
+        "voice_id": voice_id,
+        "text": text,
+        "model": model
+    }
+    headers = {
+        "X-API-KEY": api_key,
+        "Content-Type": "application/json"
+    }
+    response = requests.post(url, headers=headers, json=payload, timeout=60)
+    response.raise_for_status()
+    with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as f:
+        f.write(response.content)
+        return f.name
 def predict_gemini_tts(text: str, voice: str = "Aoede", model: str = "gemini-2.5-flash-tts") -> str: