Fix TTS: switch to 1.7B with ref_audio, speakable text on all lines

- Use 1.7B model (0.6B had tensor mismatch with cached prompts) - Speak endpoint uses ref_audio directly (not cached pkl) as fallback - Cache voice clone prompts in memory on startup - Add SpeakableText component: 🔊 icon on each p and li element - Remove old TTSReader sequential approach - Add global exception handler to TTS server - Fix profile localStorage caching - inference_mode + bf16 optimization Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
2026-04-13 12:14:06 +00:00
parent 1088b23790
commit 20210830cf
6 changed files with 440 additions and 158 deletions
--- a/sundol-frontend/src/components/speakable-text.tsx
+++ b/sundol-frontend/src/components/speakable-text.tsx
@@ -0,0 +1,85 @@
+"use client";
+
+import { useState, useRef, useEffect } from "react";
+
+interface SpeakableProps {
+  children: React.ReactNode;
+  text: string;
+}
+
+let cachedProfileId: string | null = null;
+let profileChecked = false;
+
+export default function SpeakableText({ children, text }: SpeakableProps) {
+  const [playing, setPlaying] = useState(false);
+  const [loading, setLoading] = useState(false);
+  const [hasProfile, setHasProfile] = useState(false);
+  const audioRef = useRef<HTMLAudioElement | null>(null);
+
+  useEffect(() => {
+    if (profileChecked) {
+      setHasProfile(!!cachedProfileId);
+      return;
+    }
+    try {
+      const profiles = JSON.parse(localStorage.getItem("tts_profiles") || "[]");
+      if (profiles.length > 0) {
+        cachedProfileId = profiles[0].id;
+        setHasProfile(true);
+      }
+      profileChecked = true;
+    } catch {}
+  }, []);
+
+  const handleSpeak = async (e: React.MouseEvent) => {
+    e.preventDefault();
+    e.stopPropagation();
+
+    if (playing) {
+      audioRef.current?.pause();
+      setPlaying(false);
+      return;
+    }
+
+    if (!cachedProfileId || text.length < 5) return;
+
+    setLoading(true);
+    try {
+      const fd = new FormData();
+      fd.append("text", text);
+      fd.append("profile_id", cachedProfileId);
+      fd.append("language", "Korean");
+      const res = await fetch("/api/tts/speak", { method: "POST", body: fd });
+      if (!res.ok) { setLoading(false); return; }
+      const blob = await res.blob();
+      if (blob.size < 200) { setLoading(false); return; }
+
+      const url = URL.createObjectURL(blob);
+      const audio = new Audio(url);
+      audioRef.current = audio;
+      audio.onended = () => setPlaying(false);
+      setPlaying(true);
+      setLoading(false);
+      audio.play();
+    } catch {
+      setLoading(false);
+    }
+  };
+
+  if (!hasProfile || text.length < 5) return <>{children}</>;
+
+  return (
+    <>
+      {children}
+      <button
+        onClick={handleSpeak}
+        disabled={loading}
+        className="inline-flex items-center ml-1 text-[var(--color-text-muted)] hover:text-[var(--color-primary)] disabled:opacity-30 align-middle"
+        title={playing ? "중지" : "읽어주기"}
+        style={{ fontSize: "0.85em", verticalAlign: "middle", cursor: "pointer" }}
+      >
+        {loading ? "⏳" : playing ? "⏹" : "🔊"}
+      </button>
+    </>
+  );
+}