크롤링 복구: Chrome CDP를 PM2 sundol-chrome로 상시화

Chrome 136+가 기본 프로필 디렉토리에서 원격 디버깅(CDP)을 거부하여 4월 13일 이후 웹크롤링 3차 폴백/유튜브 자막 추출이 전부 실패하던 문제 해결.

- 프로필을 non-default 디렉토리(~/.config/google-chrome-cdp)로 이동해 로그인 세션을 유지한 채 CDP 허용
- start-chrome.sh 신규: 기존 Chrome 정리 + stale lock 제거 후 --remote-debugging-port=9222 --remote-debugging-address=127.0.0.1 로 기동
- ecosystem.config.cjs: sundol-chrome PM2 앱 추가 (수동 실행 금지, PM2 통일)
  ※ frontend script의 /usr/local/bin/node 변경은 이전 작업분이 함께 포함됨
- PlaywrightBrowserService: CDP_URL을 127.0.0.1로 고정 (IPv6 ::1 해석 함정 제거)

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Fix TTS: switch to 1.7B with ref_audio, speakable text on all lines
2026-05-18 01:06:58 +00:00 · 2026-04-13 12:14:06 +00:00 · 2026-04-13 07:34:18 +00:00
20 changed files with 2193 additions and 124 deletions
--- a/.gitignore
+++ b/.gitignore
@@ -68,3 +68,6 @@ oracle_data/
 # ========================
 .claude/
 cookies.txt
+audio-uploads/
+voice-profiles/
+*.wav
--- a/ecosystem.config.cjs
+++ b/ecosystem.config.cjs
@@ -1,5 +1,14 @@
 module.exports = {
  apps: [
+    {
+      name: "sundol-chrome",
+      script: "./start-chrome.sh",
+      interpreter: "/bin/bash",
+      cwd: "/home/opc/sundol",
+      env: {
+        DISPLAY: ":1",
+      },
+    },
    {
      name: "sundol-backend",
      script: "./start-backend.sh",
@@ -12,7 +21,7 @@ module.exports = {
    },
    {
      name: "sundol-frontend",
-      script: "node",
+      script: "/usr/local/bin/node",
      args: "sundol-frontend/.next/standalone/server.js",
      cwd: "/home/opc/sundol",
      env: {
--- a/start-chrome.sh
+++ b/start-chrome.sh
@@ -0,0 +1,35 @@
+#!/bin/bash
+# Launches the user's Chrome with the CDP debugging port (9222) open.
+# Dedicated script managed by PM2 (sundol-chrome); do not run it manually.
+# Reuses the existing profile that holds the user's login session, to get around bot detection.
+set -u
+
+export DISPLAY=:1
+PROFILE_DIR="/home/opc/.config/google-chrome-cdp"
+DEBUG_PORT=9222
+
+# 1) Stop any Chrome that is already running (the pattern matches every /opt/google/chrome/chrome process).
+#    If a Chrome with the same user-data-dir is already up, a new instance cannot open
+#    the debugging port; it only hands its command to the existing instance and exits.
+pkill -TERM -f "/opt/google/chrome/chrome" 2>/dev/null || true
+for _ in $(seq 1 10); do
+  pgrep -f "/opt/google/chrome/chrome" >/dev/null 2>&1 || break
+  sleep 1
+done
+pkill -KILL -f "/opt/google/chrome/chrome" 2>/dev/null || true
+sleep 1
+
+# 2) Remove stale singleton lock files left behind by an abnormal exit.
+rm -f "$PROFILE_DIR/SingletonLock" \
+      "$PROFILE_DIR/SingletonCookie" \
+      "$PROFILE_DIR/SingletonSocket" 2>/dev/null || true
+
+# 3) Start Chrome. exec keeps it in the foreground so PM2 fork mode tracks the process.
+#    --remote-debugging-address=127.0.0.1 makes the IPv4 binding explicit.
+exec /usr/bin/google-chrome \
+  --user-data-dir="$PROFILE_DIR" \
+  --remote-debugging-port="$DEBUG_PORT" \
+  --remote-debugging-address=127.0.0.1 \
+  --no-first-run \
+  --no-default-browser-check \
+  --start-maximized
--- a/sundol-backend/src/main/java/com/sundol/controller/AuthController.java
+++ b/sundol-backend/src/main/java/com/sundol/controller/AuthController.java
@@ -45,11 +45,18 @@ public class AuthController {
    }

    @PostMapping("/refresh")
-    public Mono<ResponseEntity<LoginResponse>> refresh(ServerHttpRequest request, ServerHttpResponse response) {
+    public Mono<ResponseEntity<LoginResponse>> refresh(
+            ServerHttpRequest request, ServerHttpResponse response,
+            @RequestBody(required = false) Map<String, String> body) {
+        // 1차: body에서 refreshToken
+        String refreshToken = (body != null) ? body.get("refreshToken") : null;
+        // 2차: cookie에서 refreshToken
+        if (refreshToken == null || refreshToken.isBlank()) {
            HttpCookie cookie = request.getCookies().getFirst("refreshToken");
-        String refreshToken = cookie != null ? cookie.getValue() : null;
+            refreshToken = cookie != null ? cookie.getValue() : null;
+        }

-        if (refreshToken == null) {
+        if (refreshToken == null || refreshToken.isBlank()) {
            return Mono.just(ResponseEntity.status(401).build());
        }

--- a/sundol-backend/src/main/java/com/sundol/controller/NoteController.java
+++ b/sundol-backend/src/main/java/com/sundol/controller/NoteController.java
@@ -0,0 +1,561 @@
+package com.sundol.controller;
+
+import com.sundol.repository.CategoryRepository;
+import com.sundol.repository.NoteRepository;
+import org.slf4j.Logger;
+import org.slf4j.LoggerFactory;
+import org.springframework.beans.factory.annotation.Value;
+import org.springframework.http.ResponseEntity;
+import org.springframework.http.codec.multipart.FilePart;
+import org.springframework.security.core.annotation.AuthenticationPrincipal;
+import org.springframework.web.bind.annotation.*;
+import reactor.core.publisher.Mono;
+import reactor.core.scheduler.Schedulers;
+
+import java.io.IOException;
+import java.net.URI;
+import java.net.http.HttpClient;
+import java.net.http.HttpRequest;
+import java.net.http.HttpResponse;
+import java.nio.file.Files;
+import java.nio.file.Path;
+import java.util.Base64;
+import java.util.List;
+import java.util.Map;
+
+@RestController
+@RequestMapping("/api/notes")
+public class NoteController {
+
+    private static final Logger log = LoggerFactory.getLogger(NoteController.class);
+    private static final Path AUDIO_DIR = Path.of(System.getProperty("user.dir"), "audio-uploads");
+    private static final HttpClient httpClient = HttpClient.newHttpClient();
+
+    @Value("${openrouter.api-key:}")
+    private String openRouterApiKey;
+
+    @Value("${openrouter.model:google/gemini-2.5-flash}")
+    private String openRouterModel;
+
+    private final NoteRepository noteRepository;
+    private final CategoryRepository categoryRepository;
+    private final com.sundol.service.OciGenAiService genAiService;
+    /** Wires the collaborators; creating AUDIO_DIR stays best-effort, but a failure is logged instead of hidden. */
+    public NoteController(NoteRepository noteRepository, CategoryRepository categoryRepository,
+                          com.sundol.service.OciGenAiService genAiService) {
+        this.noteRepository = noteRepository;
+        this.categoryRepository = categoryRepository;
+        this.genAiService = genAiService;
+        try { Files.createDirectories(AUDIO_DIR); } catch (Exception e) { log.warn("Cannot create {}", AUDIO_DIR, e); }
+    }
+
+    /** Returns whatever noteRepository.list yields for the caller and the optional categoryId; the call runs on boundedElastic. */
+    @GetMapping
+    public Mono<ResponseEntity<List<Map<String, Object>>>> list(
+            @AuthenticationPrincipal String userId,
+            @RequestParam(required = false) String categoryId) {
+        Mono<List<Map<String, Object>>> rows = Mono.fromCallable(() -> noteRepository.list(userId, categoryId));
+        return rows.subscribeOn(Schedulers.boundedElastic()).map(ResponseEntity::ok);
+    }
+
+    /** Looks up the caller's note by id on boundedElastic; answers 404 when the repository returns null. */
+    @GetMapping("/{id}")
+    public Mono<ResponseEntity<Map<String, Object>>> getById(
+            @AuthenticationPrincipal String userId,
+            @PathVariable String id) {
+        return Mono.fromCallable(() -> {
+            Map<String, Object> found = noteRepository.findById(userId, id);
+            return (found != null) ? ResponseEntity.ok(found) : ResponseEntity.notFound().<Map<String, Object>>build();
+        }).subscribeOn(Schedulers.boundedElastic());
+    }
+
+    /** Inserts a TEXT note from the body's title/content ("" when the key is absent) and returns the new id. */
+    @PostMapping
+    public Mono<ResponseEntity<Map<String, Object>>> create(
+            @AuthenticationPrincipal String userId,
+            @RequestBody Map<String, String> body) {
+        return Mono.fromCallable(() -> {
+            String newId = noteRepository.insert(userId,
+                    body.getOrDefault("title", ""), body.getOrDefault("content", ""),
+                    "TEXT", null, body.get("categoryId"));
+            return ResponseEntity.ok(Map.<String, Object>of("id", newId));
+        }).subscribeOn(Schedulers.boundedElastic());
+    }
+
+    /** Passes title/content/categoryId from the body to the repository update, then returns the note as re-read afterwards. */
+    @PatchMapping("/{id}")
+    public Mono<ResponseEntity<Map<String, Object>>> update(
+            @AuthenticationPrincipal String userId,
+            @PathVariable String id,
+            @RequestBody Map<String, String> body) {
+        return Mono.fromCallable(() -> {
+            noteRepository.update(id, userId,
+                    body.get("title"), body.get("content"), body.get("categoryId"));
+            Map<String, Object> refreshed = noteRepository.findById(userId, id);
+            return ResponseEntity.ok(refreshed);
+        }).subscribeOn(Schedulers.boundedElastic());
+    }
+
+    /**
+     * Re-runs LLM polishing and summarization on an existing note; replies at once while the work runs in the background.
+     */
+    @PostMapping("/{id}/polish")
+    public Mono<ResponseEntity<Map<String, Object>>> polishNote(
+            @AuthenticationPrincipal String userId,
+            @PathVariable String id) {
+        return Mono.fromCallable(() -> {
+            Map<String, Object> note = noteRepository.findById(userId, id);
+            if (note == null) return ResponseEntity.notFound().<Map<String, Object>>build();
+
+            String content = note.get("CONTENT") != null ? note.get("CONTENT").toString() : "";
+            if (content.isBlank()) return ResponseEntity.badRequest().<Map<String, Object>>build();
+
+            // Prefer RAW_CONTENT when non-blank, else content; then keep only what follows a "# 전문" heading, if present
+            Object rawObj = note.get("RAW_CONTENT");
+            String rawText = (rawObj != null && !rawObj.toString().isBlank()) ? rawObj.toString() : content;
+            if (rawText.contains("# 전문")) {
+                int idx = rawText.indexOf("# 전문");
+                rawText = rawText.substring(idx + "# 전문".length()).strip();
+            }
+
+            String noteType = note.get("NOTE_TYPE") != null ? note.get("NOTE_TYPE").toString() : "TEXT";
+            boolean isAudio = "AUDIO".equals(noteType) || note.get("AUDIO_PATH") != null;
+
+            noteRepository.updateNoteType(id, "TRANSCRIBING");
+
+            final String finalRawText = rawText;
+            Schedulers.boundedElastic().schedule(() -> {
+                try {
+                    noteRepository.updateContent(id, finalRawText + "\n\n--- 텍스트 교정 중... ---");
+                    String polished = polishTranscription(finalRawText);
+
+                    noteRepository.updateContent(id, polished + "\n\n--- 요약 생성 중... ---");
+                    String summary = summarizeTranscription(polished);
+
+                    String result = "# 요약\n\n" + summary + "\n\n---\n\n# 전문\n\n" + polished;
+                    String newTitle = generateAudioTitle(summary, java.time.LocalDateTime.now());
+                    noteRepository.update(id, null, newTitle, result, null);
+                    noteRepository.updateNoteType(id, isAudio ? "AUDIO" : "TEXT");
+                    log.info("Polish + summary complete for note {}", id);
+                } catch (Exception e) {
+                    log.error("Polish failed for note {}", id, e);
+                    noteRepository.updateNoteType(id, isAudio ? "AUDIO" : "TEXT");
+                }
+            });
+
+            return ResponseEntity.ok(Map.<String, Object>of("status", "processing"));
+        }).subscribeOn(Schedulers.boundedElastic());
+    }
+
+    /** Runs noteRepository.delete on boundedElastic and then answers 200 with an empty body. */
+    @DeleteMapping("/{id}")
+    public Mono<ResponseEntity<Void>> delete(
+            @AuthenticationPrincipal String userId,
+            @PathVariable String id) {
+        Mono<Object> removal = Mono.fromRunnable(() -> noteRepository.delete(id, userId));
+        return removal.subscribeOn(Schedulers.boundedElastic()).then(Mono.just(ResponseEntity.ok().<Void>build()));
+    }
+
+    /**
+     * Stores the uploaded audio under AUDIO_DIR, inserts a TRANSCRIBING note, and schedules STT in the background.
+     */
+    @PostMapping("/audio")
+    public Mono<ResponseEntity<Map<String, Object>>> uploadAudio(
+            @AuthenticationPrincipal String userId,
+            @RequestPart("file") FilePart filePart,
+            @RequestPart(value = "title", required = false) String title,
+            @RequestPart(value = "categoryId", required = false) String categoryId) {
+        final String inputTitle = (title != null && !title.isBlank()) ? title : "음성 변환 중...";
+        return Mono.fromCallable(() -> {
+            // 1. Save the file. filename() is client-supplied and may hold path separators; keep only the last segment.
+            String clientName = filePart.filename();
+            String baseName = clientName.substring(Math.max(clientName.lastIndexOf('/'), clientName.lastIndexOf('\\')) + 1);
+            String fileName = System.currentTimeMillis() + "_" + baseName;
+            Path audioFile = AUDIO_DIR.resolve(fileName);
+            filePart.transferTo(audioFile).block();
+            log.info("Audio file saved: {} ({} bytes)", audioFile, Files.size(audioFile));
+
+            // 2. Create the note right away (TRANSCRIBING state)
+            String id = noteRepository.insert(userId, inputTitle, "음성 변환을 시작합니다...", "TRANSCRIBING", fileName, categoryId);
+
+            // 3. Run STT in the background
+            Schedulers.boundedElastic().schedule(() -> {
+                try {
+                    transcribeAsync(id, audioFile, inputTitle);
+                } catch (Exception e) {
+                    log.error("Async transcription failed for note {}", id, e);
+                    noteRepository.updateContent(id, "음성 변환에 실패했습니다: " + e.getMessage());
+                    noteRepository.updateNoteType(id, "AUDIO_FAILED");
+                }
+            });
+            return ResponseEntity.ok(Map.<String, Object>of("id", id));
+        }).subscribeOn(Schedulers.boundedElastic());
+    }
+
+    /**
+     * Asynchronous STT pipeline.
+     * Step 1: STT via OpenRouter (Gemini) → stored in raw_content
+     * Step 2: polishing via OCI GenAI → stored in content
+     * Step 3: summary via OCI GenAI → placed in front of the content
+     */
+    private void transcribeAsync(String noteId, Path audioFile, String inputTitle) throws IOException, InterruptedException {
+        // === Step 1: STT (OpenRouter Gemini) ===
+        String rawResult = null;
+
+        if (openRouterApiKey != null && !openRouterApiKey.isBlank()) {
+            try {
+                noteRepository.updateContent(noteId, "Gemini로 음성 변환 중...");
+                rawResult = transcribeWithOpenRouter(audioFile);
+                log.info("OpenRouter STT: {} chars", rawResult != null ? rawResult.length() : 0);
+            } catch (Exception e) {
+                log.warn("OpenRouter STT failed: {}", e.getMessage());
+                noteRepository.updateContent(noteId, "Gemini STT 실패: " + e.getMessage());
+            }
+        }
+
+        // Gemma fallback when OpenRouter gave nothing. NOTE(review): one transcribeChunk call, transcribeWithGemma's chunking unused — confirm
+        if (rawResult == null || rawResult.isBlank()) {
+            try {
+                noteRepository.updateContent(noteId, "Gemma로 음성 변환 중...");
+                Path wavFile = convertToWav(audioFile);
+                rawResult = transcribeChunk(wavFile);
+                cleanup(wavFile, audioFile);
+            } catch (Exception e) {
+                log.error("All STT failed for note {}", noteId, e);
+                noteRepository.updateContent(noteId, "모든 음성 변환 실패: " + e.getMessage());
+                noteRepository.updateNoteType(noteId, "AUDIO_FAILED");
+                return;
+            }
+        }
+
+        if (rawResult == null || rawResult.isBlank()) {
+            noteRepository.updateContent(noteId, "음성 변환 결과가 비어있습니다.");
+            noteRepository.updateNoteType(noteId, "AUDIO_FAILED");
+            return;
+        }
+
+        // Store the raw text in its own column and, for the time being, in content as well
+        noteRepository.updateRawContent(noteId, rawResult);
+        noteRepository.updateContent(noteId, rawResult);
+        String sttTitle = java.time.LocalDateTime.now().format(
+                java.time.format.DateTimeFormatter.ofPattern("yyyy-MM-dd HH:mm")) + " 음성 메모";
+        noteRepository.update(noteId, null,
+                inputTitle.equals("음성 변환 중...") ? sttTitle : inputTitle,
+                rawResult, null);
+        noteRepository.updateNoteType(noteId, "AUDIO");
+        log.info("STT raw saved: {} chars", rawResult.length());
+
+        // === Step 2: polishing (OCI GenAI) ===
+        try {
+            noteRepository.updateNoteType(noteId, "TRANSCRIBING");
+            noteRepository.updateContent(noteId, rawResult + "\n\n--- 텍스트 교정 중 (OCI GenAI)... ---");
+            String polished = polishTranscription(rawResult);
+            log.info("Polish complete: {} chars", polished.length());
+
+            // === Step 3: summary (OCI GenAI) ===
+            noteRepository.updateContent(noteId, polished + "\n\n--- 요약 생성 중... ---");
+            String summary = summarizeTranscription(polished);
+            log.info("Summary complete: {} chars", summary.length());
+
+            // Save the final result
+            String result = "# 요약\n\n" + summary + "\n\n---\n\n# 전문\n\n" + polished;
+            String finalTitle = inputTitle.equals("음성 변환 중...")
+                    ? generateAudioTitle(summary, java.time.LocalDateTime.now())
+                    : inputTitle;
+            noteRepository.update(noteId, null, finalTitle, result, null);
+            log.info("Final note saved: {} chars", result.length());
+        } catch (Exception e) {
+            log.warn("Polish/summary failed, keeping raw STT text: {}", e.getMessage());
+        }
+
+        noteRepository.updateNoteType(noteId, "AUDIO");
+    }
+
+    /**
+     * Converts the audio file to WAV (for Ollama compatibility) by running ffmpeg with -ar 16000 -ac 1.
+     * A file whose name already ends in ".wav" (case-insensitive) is returned unchanged.
+     *
+     * @throws IOException when ffmpeg exits with a non-zero code
+     */
+    private Path convertToWav(Path audioFile) throws IOException, InterruptedException {
+        String name = audioFile.getFileName().toString();
+        if (name.toLowerCase().endsWith(".wav")) return audioFile;
+
+        Path wavFile = audioFile.getParent().resolve(name.replaceAll("\\.[^.]+$", "") + ".wav");
+        ProcessBuilder pb = new ProcessBuilder(
+                "ffmpeg", "-i", audioFile.toString(),
+                "-ar", "16000", "-ac", "1", "-y",
+                wavFile.toString()
+        );
+        pb.redirectErrorStream(true);
+        Process proc = pb.start();
+        String output = new String(proc.getInputStream().readAllBytes());
+        int exitCode = proc.waitFor();
+        if (exitCode != 0) {
+            log.error("ffmpeg conversion failed (exit {}): {}", exitCode, output.substring(0, Math.min(500, output.length())));
+            throw new IOException("오디오 변환 실패 (ffmpeg exit " + exitCode + ")");
+        }
+        log.info("Converted {} to wav: {} bytes", name, Files.size(wavFile));
+        return wavFile;
+    }
+
+    private static final int CHUNK_SECONDS = 180; // split into 3-minute chunks
+    /** Gemma STT: audio up to CHUNK_SECONDS goes through transcribeChunk whole; longer audio is cut with ffmpeg and the texts joined. */
+    private String transcribeWithGemma(Path audioFile) throws IOException, InterruptedException {
+        Path wavFile = convertToWav(audioFile);
+        double duration = getAudioDuration(wavFile);
+        log.info("Audio duration: {}s", duration);
+
+        if (duration <= CHUNK_SECONDS) {
+            String result = transcribeChunk(wavFile);
+            cleanup(wavFile, audioFile);
+            return result;
+        }
+
+        // Long audio: split into 3-minute pieces
+        int chunks = (int) Math.ceil(duration / CHUNK_SECONDS);
+        log.info("Splitting audio into {} chunks of {}s", chunks, CHUNK_SECONDS);
+
+        StringBuilder fullText = new StringBuilder();
+        for (int i = 0; i < chunks; i++) {
+            int start = i * CHUNK_SECONDS;
+            Path chunkFile = wavFile.getParent().resolve("chunk_" + i + "_" + System.currentTimeMillis() + ".wav");
+
+            ProcessBuilder pb = new ProcessBuilder(
+                    "ffmpeg", "-i", wavFile.toString(),
+                    "-ss", String.valueOf(start), "-t", String.valueOf(CHUNK_SECONDS),
+                    "-ar", "16000", "-ac", "1", "-y", chunkFile.toString()
+            );
+            pb.redirectErrorStream(true);
+            Process proc = pb.start();
+            proc.getInputStream().readAllBytes();
+            proc.waitFor();
+
+            log.info("Transcribing chunk {}/{} ({}s-{}s)", i + 1, chunks, start, Math.min(start + CHUNK_SECONDS, (int) duration));
+
+            try {
+                String chunkText = transcribeChunk(chunkFile);
+                if (!chunkText.isBlank()) {
+                    if (fullText.length() > 0) fullText.append("\n\n");
+                    fullText.append(chunkText);
+                }
+            } catch (Exception e) {
+                log.warn("Chunk {} failed: {}", i + 1, e.getMessage());
+                fullText.append("\n\n[chunk ").append(i + 1).append(" 변환 실패]");
+            } finally {
+                try { Files.deleteIfExists(chunkFile); } catch (Exception ignored) {}
+            }
+        }
+
+        cleanup(wavFile, audioFile);
+        String result = fullText.toString().strip();
+        if (result.isBlank()) throw new IOException("Gemma STT returned empty for all chunks");
+        return result;
+    }
+
+    /** Posts one file, base64-encoded in the message's "images" array, to the local Ollama chat endpoint and returns the stripped reply. */
+    private String transcribeChunk(Path wavFile) throws IOException, InterruptedException {
+        byte[] wavBytes = Files.readAllBytes(wavFile);
+        String encoded = Base64.getEncoder().encodeToString(wavBytes);
+        log.info("Chunk base64: {} chars ({} MB)", encoded.length(), wavBytes.length / 1024 / 1024);
+        String payload = """
+                {
+                  "model": "gemma4:e4b",
+                  "messages": [{"role": "user", "content": "Transcribe the following audio to text accurately. Output only the spoken content in its original language. Do not add any description or translation.", "images": ["%s"]}],
+                  "stream": false,
+                  "options": {"num_ctx": 8000}
+                }
+                """.formatted(encoded);
+
+        HttpRequest request = HttpRequest.newBuilder()
+                .uri(URI.create("http://localhost:11434/api/chat"))
+                .header("Content-Type", "application/json")
+                .POST(HttpRequest.BodyPublishers.ofString(payload))
+                .timeout(java.time.Duration.ofMinutes(10))
+                .build();
+        HttpResponse<String> response = httpClient.send(request, HttpResponse.BodyHandlers.ofString());
+        if (response.statusCode() != 200) {
+            String errorBody = response.body();
+            log.error("Gemma STT error {}: {}", response.statusCode(), errorBody.substring(0, Math.min(500, errorBody.length())));
+            throw new IOException("Gemma STT failed: HTTP " + response.statusCode());
+        }
+
+        var root = new com.fasterxml.jackson.databind.ObjectMapper().readTree(response.body());
+        return root.path("message").path("content").asText("").strip();
+    }
+
+    /**
+     * Polishes the STT result with the LLM; returns the raw text when GenAI is not configured or the call fails.
+     * The prompt asks for misrecognition fixes, sentence breaks, filler-word removal and better readability.
+     */
+    private String polishTranscription(String rawText) {
+        if (!genAiService.isConfigured()) {
+            log.info("GenAI not configured, skipping polish");
+            return rawText;
+        }
+
+        try {
+            String systemMsg =
+                    "당신은 전문 속기사입니다. 음성 인식(STT) 텍스트를 교정해주세요.\n\n" +
+                    "## 규칙\n" +
+                    "1. 발음 오인식 단어를 문맥에 맞게 보정하세요.\n" +
+                    "2. 추임새(어, 음, 그, 아, 뭐, 이제, 근데)를 제거하세요.\n" +
+                    "3. 문장 부호를 넣고 단락을 나누세요.\n" +
+                    "4. 절대 요약하지 마세요. 원문의 모든 내용을 빠짐없이 유지하세요.\n" +
+                    "5. 내용을 추가하거나 삭제하지 마세요. 교정만 하세요.\n" +
+                    "6. 전문 용어와 고유 명사는 올바르게 표기하세요.\n" +
+                    "7. 입력 텍스트와 비슷한 분량으로 출력하세요. 줄이지 마세요.\n" +
+                    "8. Markdown 형식으로 출력하세요.";
+
+            // Original note: maxTokens is 65536, so most inputs fit in one call (TODO confirm against the GenAI config)
+            if (rawText.length() <= 30000) {
+                log.info("Polishing in single call: {} chars", rawText.length());
+                return genAiService.chat(systemMsg,
+                        "아래 STT 텍스트를 교정해주세요. 전체 내용을 빠짐없이 유지하세요:\n\n" + rawText, null).strip();
+            }
+
+            // Only texts longer than 30000 chars are split, into fixed 20000-char slices
+            StringBuilder polished = new StringBuilder();
+            int chunkSize = 20000;
+            int totalChunks = (int) Math.ceil((double) rawText.length() / chunkSize);
+            for (int i = 0; i < rawText.length(); i += chunkSize) {
+                int chunkNum = (i / chunkSize) + 1;
+                String chunk = rawText.substring(i, Math.min(i + chunkSize, rawText.length()));
+                log.info("Polishing chunk {}/{}: {} chars", chunkNum, totalChunks, chunk.length());
+                String result = genAiService.chat(systemMsg,
+                        "아래 STT 텍스트를 교정해주세요. 전체 내용을 빠짐없이 유지하세요:\n\n" + chunk, null).strip();
+                if (polished.length() > 0) polished.append("\n\n");
+                polished.append(result);
+            }
+            return polished.toString();
+        } catch (Exception e) {
+            log.warn("Polish transcription failed, returning raw text: {}", e.getMessage());
+            return rawText;
+        }
+    }
+
+    /**
+     * Summarizes the polished text through the GenAI service; only the first 15000 chars are sent.
+     * Returns "" when the service is not configured or the call fails.
+     */
+    private String summarizeTranscription(String polishedText) {
+        if (!genAiService.isConfigured()) return "";
+        try {
+            String systemMsg =
+                    "당신은 회의록/녹음 요약 전문가입니다. 아래 텍스트를 요약해주세요.\n\n" +
+                    "## 규칙\n" +
+                    "1. 주요 논의 주제별로 소제목(##)을 나누어 요약하세요.\n" +
+                    "2. 각 주제 아래 핵심 내용을 불릿 포인트로 정리하세요.\n" +
+                    "3. 주요 결정 사항, 액션 아이템이 있다면 별도로 표시하세요.\n" +
+                    "4. 원문과 같은 언어로 작성하세요.\n" +
+                    "5. Markdown 형식으로 작성하세요.\n" +
+                    "6. 원본 길이에 비례하여 요약하세요. 긴 내용은 상세하게, 짧은 내용은 간결하게.\n" +
+                    "7. 중요한 수치, 이름, 기술명은 빠뜨리지 마세요.";
+
+            String excerpt = polishedText.substring(0, Math.min(polishedText.length(), 15000));
+            String userMsg = "아래 내용을 요약해주세요:\n\n" + excerpt;
+            return genAiService.chat(systemMsg, userMsg, null).strip();
+        } catch (Exception e) {
+            log.warn("Summarization failed: {}", e.getMessage());
+            return "";
+        }
+    }
+
+    /**
+     * Builds "yyyy-MM-dd HH:mm <title>": the title comes from the LLM (outer quotes trimmed, max 40 chars), else "음성 메모".
+     */
+    private String generateAudioTitle(String summary, java.time.LocalDateTime dateTime) {
+        String stamp = dateTime.format(java.time.format.DateTimeFormatter.ofPattern("yyyy-MM-dd HH:mm"));
+        String fallback = stamp + " 음성 메모";
+        if (!genAiService.isConfigured() || summary.isBlank()) return fallback;
+
+        try {
+            String systemMsg = "음성 메모의 요약을 보고 10자 이내의 짧은 제목을 생성해주세요. " +
+                    "제목만 출력하세요. 따옴표, 설명, 접두사 없이 제목만.";
+            String title = genAiService.chat(systemMsg, summary, null).strip()
+                    .replaceAll("^\"|\"$", "").replaceAll("^'|'$", "");
+            if (title.length() > 40) title = title.substring(0, 40);
+            return stamp + " " + title;
+        } catch (Exception e) {
+            log.warn("Title generation failed: {}", e.getMessage());
+            return fallback;
+        }
+    }
+
+    /**
+     * Speech-to-text through the OpenRouter chat/completions API (default model: Gemini 2.5 Flash); the whole file
+     * goes out in one request. "format" carries the codec name (mp3, m4a, ...), not the MIME subtype (mpeg, mp4).
+     */
+    private String transcribeWithOpenRouter(Path audioFile) throws IOException, InterruptedException {
+        byte[] audioBytes = Files.readAllBytes(audioFile);
+        String base64Audio = Base64.getEncoder().encodeToString(audioBytes);
+
+        // mimeType is only logged; format is what the input_audio part sends. Unknown extensions default to wav.
+        String mimeType = "audio/wav";
+        String format = "wav";
+        String name = audioFile.getFileName().toString().toLowerCase();
+        if (name.endsWith(".mp3")) { mimeType = "audio/mpeg"; format = "mp3"; }
+        else if (name.endsWith(".m4a")) { mimeType = "audio/mp4"; format = "m4a"; }
+        else if (name.endsWith(".ogg")) { mimeType = "audio/ogg"; format = "ogg"; }
+        else if (name.endsWith(".webm")) { mimeType = "audio/webm"; format = "webm"; }
+        else if (name.endsWith(".flac")) { mimeType = "audio/flac"; format = "flac"; }
+
+        log.info("OpenRouter STT: {} ({} MB, {})", name, audioBytes.length / 1024 / 1024, mimeType);
+        // OpenRouter chat/completions API with audio input
+        String payload = new com.fasterxml.jackson.databind.ObjectMapper().writeValueAsString(Map.of(
+            "model", openRouterModel,
+            "messages", List.of(Map.of(
+                "role", "user",
+                "content", List.of(
+                    Map.of("type", "input_audio", "input_audio", Map.of(
+                        "data", base64Audio,
+                        "format", format
+                    )),
+                    Map.of("type", "text", "text",
+                        "Transcribe the audio accurately. Output only the spoken content in its original language. " +
+                        "Do not add description, annotation, timestamps, or translation. " +
+                        "If the audio contains Korean, output in Korean.")
+                )
+            ))
+        ));
+
+        HttpRequest request = HttpRequest.newBuilder()
+                .uri(URI.create("https://openrouter.ai/api/v1/chat/completions"))
+                .header("Content-Type", "application/json")
+                .header("Authorization", "Bearer " + openRouterApiKey)
+                .POST(HttpRequest.BodyPublishers.ofString(payload))
+                .timeout(java.time.Duration.ofMinutes(10))
+                .build();
+
+        HttpResponse<String> response = httpClient.send(request, HttpResponse.BodyHandlers.ofString());
+        if (response.statusCode() != 200) {
+            log.error("OpenRouter STT error {}: {}", response.statusCode(),
+                    response.body().substring(0, Math.min(500, response.body().length())));
+            throw new IOException("OpenRouter STT failed: HTTP " + response.statusCode());
+        }
+
+        var root = new com.fasterxml.jackson.databind.ObjectMapper().readTree(response.body());
+        String text = root.path("choices").path(0).path("message").path("content").asText("").strip();
+
+        if (text.isBlank()) {
+            throw new IOException("OpenRouter STT returned empty result");
+        }
+        return text;
+    }
+
+    /** Runs ffprobe for format=duration and parses its output as seconds; yields 0 when the output is not a number. */
+    private double getAudioDuration(Path audioFile) throws IOException, InterruptedException {
+        Process proc = new ProcessBuilder("ffprobe", "-i", audioFile.toString(),
+                "-show_entries", "format=duration", "-v", "quiet", "-of", "csv=p=0")
+                .redirectErrorStream(true).start();
+        String output = new String(proc.getInputStream().readAllBytes()).strip();
+        proc.waitFor();
+        try { return Double.parseDouble(output); } catch (NumberFormatException e) { return 0; }
+    }
+
+    /** Best-effort removal of the converted WAV; does nothing when it is the original file itself. */
+    private void cleanup(Path wavFile, Path originalFile) {
+        if (wavFile.equals(originalFile)) return;
+        try { Files.deleteIfExists(wavFile); } catch (Exception ignored) {}
+    }
+}
--- a/sundol-backend/src/main/java/com/sundol/repository/NoteRepository.java
+++ b/sundol-backend/src/main/java/com/sundol/repository/NoteRepository.java
@@ -0,0 +1,148 @@
+package com.sundol.repository;
+
+import org.springframework.jdbc.core.JdbcTemplate;
+import org.springframework.stereotype.Repository;
+
+import java.sql.Clob;
+import java.util.List;
+import java.util.Map;
+
+/**
+ * JDBC data access for the {@code notes} table.
+ *
+ * <p>Ids are passed in and out as hex strings; the SQL converts them with
+ * {@code HEXTORAW} / {@code RAWTOHEX}.
+ */
+@Repository
+public class NoteRepository {
+
+    private final JdbcTemplate jdbcTemplate;
+
+    public NoteRepository(JdbcTemplate jdbcTemplate) {
+        this.jdbcTemplate = jdbcTemplate;
+    }
+
+    /**
+     * Inserts a note and returns its id.
+     *
+     * <p>The id is generated with {@code SYS_GUID()} before the insert and written explicitly.
+     * Looking the row up afterwards by "latest created_at for this user" could return a
+     * different note when the same user inserts concurrently.
+     *
+     * @param userId     owner id as a hex string
+     * @param title      note title
+     * @param content    note body, bound as a CLOB
+     * @param noteType   value stored in {@code note_type}
+     * @param audioPath  value stored in {@code audio_path}
+     * @param categoryId category id as a hex string; when {@code null} the column is omitted from the insert
+     * @return the new note's id as the hex string produced by {@code RAWTOHEX}
+     */
+    public String insert(String userId, String title, String content, String noteType, String audioPath, String categoryId) {
+        String id = jdbcTemplate.queryForObject("SELECT RAWTOHEX(SYS_GUID()) FROM dual", String.class);
+        if (categoryId != null) {
+            jdbcTemplate.update(
+                "INSERT INTO notes (id, user_id, title, content, note_type, audio_path, category_id, created_at, updated_at) " +
+                "VALUES (HEXTORAW(?), HEXTORAW(?), ?, ?, ?, ?, HEXTORAW(?), SYSTIMESTAMP, SYSTIMESTAMP)",
+                new Object[]{id, userId, title, content, noteType, audioPath, categoryId},
+                new int[]{java.sql.Types.VARCHAR, java.sql.Types.VARCHAR, java.sql.Types.VARCHAR, java.sql.Types.CLOB, java.sql.Types.VARCHAR, java.sql.Types.VARCHAR, java.sql.Types.VARCHAR}
+            );
+        } else {
+            jdbcTemplate.update(
+                "INSERT INTO notes (id, user_id, title, content, note_type, audio_path, created_at, updated_at) " +
+                "VALUES (HEXTORAW(?), HEXTORAW(?), ?, ?, ?, ?, SYSTIMESTAMP, SYSTIMESTAMP)",
+                new Object[]{id, userId, title, content, noteType, audioPath},
+                new int[]{java.sql.Types.VARCHAR, java.sql.Types.VARCHAR, java.sql.Types.VARCHAR, java.sql.Types.CLOB, java.sql.Types.VARCHAR, java.sql.Types.VARCHAR}
+            );
+        }
+        return id;
+    }
+
+    /**
+     * Lists a user's notes, newest first, without the note body.
+     *
+     * @param userId     owner id as a hex string
+     * @param categoryId when non-null and non-blank, only notes in this category are returned
+     * @return one map per note, keyed by column label
+     */
+    public List<Map<String, Object>> list(String userId, String categoryId) {
+        if (categoryId != null && !categoryId.isBlank()) {
+            return jdbcTemplate.queryForList(
+                "SELECT RAWTOHEX(n.id) AS id, n.title, n.note_type, n.audio_path, " +
+                "  RAWTOHEX(n.category_id) AS category_id, c.full_path AS category_path, " +
+                "  n.created_at, n.updated_at " +
+                "FROM notes n LEFT JOIN categories c ON c.id = n.category_id " +
+                "WHERE n.user_id = HEXTORAW(?) AND n.category_id = HEXTORAW(?) " +
+                "ORDER BY n.created_at DESC",
+                userId, categoryId
+            );
+        }
+        return jdbcTemplate.queryForList(
+            "SELECT RAWTOHEX(n.id) AS id, n.title, n.note_type, n.audio_path, " +
+            "  RAWTOHEX(n.category_id) AS category_id, c.full_path AS category_path, " +
+            "  n.created_at, n.updated_at " +
+            "FROM notes n LEFT JOIN categories c ON c.id = n.category_id " +
+            "WHERE n.user_id = HEXTORAW(?) " +
+            "ORDER BY n.created_at DESC",
+            userId
+        );
+    }
+
+    /**
+     * Loads a single note, including {@code content} and {@code raw_content}, for its owner.
+     *
+     * @param userId owner id as a hex string
+     * @param id     note id as a hex string
+     * @return the row with CLOB values converted to strings, or {@code null} when no row matches
+     */
+    public Map<String, Object> findById(String userId, String id) {
+        var results = jdbcTemplate.queryForList(
+            "SELECT RAWTOHEX(n.id) AS id, n.title, n.content, n.raw_content, n.note_type, n.audio_path, " +
+            "  RAWTOHEX(n.category_id) AS category_id, c.full_path AS category_path, " +
+            "  n.created_at, n.updated_at " +
+            "FROM notes n LEFT JOIN categories c ON c.id = n.category_id " +
+            "WHERE RAWTOHEX(n.id) = ? AND n.user_id = HEXTORAW(?)",
+            id, userId
+        );
+        if (results.isEmpty()) return null;
+        return convertClobFields(results.get(0));
+    }
+
+    /**
+     * Updates a note's title and content, and optionally its category.
+     *
+     * @param id         note id as a hex string
+     * @param userId     owner id; when {@code null} the update matches by note id only
+     *                   (internal callers) and {@code categoryId} is ignored
+     * @param title      new title
+     * @param content    new body, bound as a CLOB
+     * @param categoryId new category id; when {@code null} the stored category is left unchanged
+     */
+    public void update(String id, String userId, String title, String content, String categoryId) {
+        if (userId != null) {
+            if (categoryId != null) {
+                jdbcTemplate.update(
+                    "UPDATE notes SET title = ?, content = ?, category_id = HEXTORAW(?), updated_at = SYSTIMESTAMP " +
+                    "WHERE RAWTOHEX(id) = ? AND user_id = HEXTORAW(?)",
+                    new Object[]{title, content, categoryId, id, userId},
+                    new int[]{java.sql.Types.VARCHAR, java.sql.Types.CLOB, java.sql.Types.VARCHAR, java.sql.Types.VARCHAR, java.sql.Types.VARCHAR}
+                );
+            } else {
+                jdbcTemplate.update(
+                    "UPDATE notes SET title = ?, content = ?, updated_at = SYSTIMESTAMP " +
+                    "WHERE RAWTOHEX(id) = ? AND user_id = HEXTORAW(?)",
+                    new Object[]{title, content, id, userId},
+                    new int[]{java.sql.Types.VARCHAR, java.sql.Types.CLOB, java.sql.Types.VARCHAR, java.sql.Types.VARCHAR}
+                );
+            }
+        } else {
+            // Internal call (no userId): not scoped to an owner.
+            jdbcTemplate.update(
+                "UPDATE notes SET title = ?, content = ?, updated_at = SYSTIMESTAMP WHERE RAWTOHEX(id) = ?",
+                new Object[]{title, content, id},
+                new int[]{java.sql.Types.VARCHAR, java.sql.Types.CLOB, java.sql.Types.VARCHAR}
+            );
+        }
+    }
+
+    /** Replaces {@code raw_content} of the note with the given id; matches by note id only. */
+    public void updateRawContent(String id, String rawContent) {
+        jdbcTemplate.update(
+            "UPDATE notes SET raw_content = ?, updated_at = SYSTIMESTAMP WHERE RAWTOHEX(id) = ?",
+            new Object[]{rawContent, id},
+            new int[]{java.sql.Types.CLOB, java.sql.Types.VARCHAR}
+        );
+    }
+
+    /** Replaces {@code content} of the note with the given id; matches by note id only. */
+    public void updateContent(String id, String content) {
+        jdbcTemplate.update(
+            "UPDATE notes SET content = ?, updated_at = SYSTIMESTAMP WHERE RAWTOHEX(id) = ?",
+            new Object[]{content, id},
+            new int[]{java.sql.Types.CLOB, java.sql.Types.VARCHAR}
+        );
+    }
+
+    /** Sets {@code note_type} of the note with the given id; matches by note id only. */
+    public void updateNoteType(String id, String noteType) {
+        jdbcTemplate.update(
+            "UPDATE notes SET note_type = ?, updated_at = SYSTIMESTAMP WHERE RAWTOHEX(id) = ?",
+            noteType, id
+        );
+    }
+
+    /** Deletes the note with the given id if it belongs to {@code userId}. */
+    public void delete(String id, String userId) {
+        jdbcTemplate.update(
+            "DELETE FROM notes WHERE RAWTOHEX(id) = ? AND user_id = HEXTORAW(?)",
+            id, userId
+        );
+    }
+
+    /**
+     * Replaces every {@link Clob} value in the row with its string content, in place.
+     * A value that cannot be read is replaced with {@code null}.
+     *
+     * @return the same map instance that was passed in
+     */
+    private Map<String, Object> convertClobFields(Map<String, Object> row) {
+        for (var entry : row.entrySet()) {
+            Object val = entry.getValue();
+            if (val instanceof Clob clob) {
+                try {
+                    // Clob positions are 1-based.
+                    entry.setValue(clob.getSubString(1, (int) clob.length()));
+                } catch (Exception e) {
+                    entry.setValue(null);
+                }
+            }
+        }
+        return row;
+    }
+}
--- a/sundol-backend/src/main/java/com/sundol/service/OciGenAiService.java
+++ b/sundol-backend/src/main/java/com/sundol/service/OciGenAiService.java
@@ -96,7 +96,7 @@ public class OciGenAiService {
                    Map.of("role", "SYSTEM", "content", List.of(Map.of("type", "TEXT", "text", systemMessage))),
                    Map.of("role", "USER", "content", List.of(Map.of("type", "TEXT", "text", userMessage)))
                ),
-                "maxTokens", 4096,
+                "maxTokens", 65536,
                "temperature", 0.3
            )
        );
--- a/sundol-backend/src/main/java/com/sundol/service/PlaywrightBrowserService.java
+++ b/sundol-backend/src/main/java/com/sundol/service/PlaywrightBrowserService.java
@@ -20,7 +20,7 @@ import java.util.List;
 public class PlaywrightBrowserService {

    private static final Logger log = LoggerFactory.getLogger(PlaywrightBrowserService.class);
-    private static final String CDP_URL = "http://localhost:9222";
+    private static final String CDP_URL = "http://127.0.0.1:9222";

    private Playwright playwright;
    private Browser browser;
--- a/sundol-backend/src/main/resources/application.yml
+++ b/sundol-backend/src/main/resources/application.yml
@@ -29,6 +29,10 @@ oci:
    model: ${OCI_GENAI_MODEL:google.gemini-2.5-flash}
    base-url: ${OCI_GENAI_BASE_URL:https://inference.generativeai.us-chicago-1.oci.oraclecloud.com/20231130/actions}

+openrouter:
+  api-key: ${OPENROUTER_API_KEY:}
+  model: ${OPENROUTER_MODEL:google/gemini-2.5-flash}
+
 jina:
  reader:
    api-key: ${JINA_READER_API_KEY:}
--- a/sundol-frontend/src/app/knowledge/[id]/page.tsx
+++ b/sundol-frontend/src/app/knowledge/[id]/page.tsx
@@ -6,6 +6,7 @@ import AuthGuard from "@/components/auth-guard";
 import NavBar from "@/components/nav-bar";
 import { useApi } from "@/lib/use-api";
 import ReactMarkdown from "react-markdown";
+import SpeakableText from "@/components/speakable-text";

 interface Category {
  ID: string;
@@ -314,10 +315,18 @@ export default function KnowledgeDetailPage() {
                      h1: ({children}) => <h1 className="text-xl font-bold mt-6 mb-3">{children}</h1>,
                      h2: ({children}) => <h2 className="text-lg font-bold mt-5 mb-2">{children}</h2>,
                      h3: ({children}) => <h3 className="text-base font-bold mt-4 mb-2">{children}</h3>,
-                      p: ({children}) => <p className="mb-3">{children}</p>,
+                      p: ({children, node}) => {
+                        // eslint-disable-next-line @typescript-eslint/no-explicit-any
+                        const txt = node?.children?.map((c: any) => c.type === 'text' ? c.value : '').join('') || '';
+                        return <p className="mb-3"><SpeakableText text={txt}>{children}</SpeakableText></p>;
+                      },
                      ul: ({children}) => <ul className="list-disc ml-5 mb-3 space-y-1">{children}</ul>,
                      ol: ({children}) => <ol className="list-decimal ml-5 mb-3 space-y-1">{children}</ol>,
-                      li: ({children}) => <li className="leading-relaxed">{children}</li>,
+                      li: ({children, node}) => {
+                        // eslint-disable-next-line @typescript-eslint/no-explicit-any
+                        const txt = node?.children?.map((c: any) => c.type === 'text' ? c.value : '').join('') || '';
+                        return <li className="leading-relaxed"><SpeakableText text={txt}>{children}</SpeakableText></li>;
+                      },
                      strong: ({children}) => <strong className="font-bold">{children}</strong>,
                      blockquote: ({children}) => <blockquote className="border-l-2 border-[var(--color-primary)] pl-4 my-3 italic text-[var(--color-text-muted)]">{children}</blockquote>,
                      code: ({children}) => <code className="bg-[var(--color-bg-hover)] px-1.5 py-0.5 rounded text-xs">{children}</code>,
--- a/sundol-frontend/src/app/notes/[id]/page.tsx
+++ b/sundol-frontend/src/app/notes/[id]/page.tsx
@@ -0,0 +1,284 @@
+"use client";
+
+import { useEffect, useState } from "react";
+import { useParams, useRouter } from "next/navigation";
+import AuthGuard from "@/components/auth-guard";
+import NavBar from "@/components/nav-bar";
+import { useApi } from "@/lib/use-api";
+import ReactMarkdown from "react-markdown";
+import SpeakableText from "@/components/speakable-text";
+
+interface NoteDetail {
+  ID: string;
+  TITLE: string;
+  CONTENT: string;
+  RAW_CONTENT: string | null;
+  NOTE_TYPE: string;
+  AUDIO_PATH: string | null;
+  CATEGORY_PATH: string | null;
+  CREATED_AT: string;
+  UPDATED_AT: string;
+}
+
+export default function NoteDetailPage() {
+  const { request } = useApi();
+  const router = useRouter();
+  const params = useParams();
+  const id = params.id as string;
+
+  const [note, setNote] = useState<NoteDetail | null>(null);
+  const [loading, setLoading] = useState(true);
+  const [editing, setEditing] = useState(false);
+  const [editTitle, setEditTitle] = useState("");
+  const [editContent, setEditContent] = useState("");
+  const [saving, setSaving] = useState(false);
+  const [deleting, setDeleting] = useState(false);
+  const [polishing, setPolishing] = useState(false);
+  const [showRaw, setShowRaw] = useState(false);
+
+  /**
+   * Loads the note for the current route id and copies it into both the view state
+   * and the edit-form state. Failures are only logged; the loading flag is always cleared.
+   */
+  const fetchNote = async () => {
+    try {
+      const loaded = await request<NoteDetail>({ method: "GET", url: `/api/notes/${id}` });
+      setNote(loaded);
+      const loadedTitle = loaded.TITLE || "";
+      setEditTitle(loadedTitle);
+      const loadedContent = loaded.CONTENT || "";
+      setEditContent(loadedContent);
+    } catch (loadError) {
+      console.error("Failed to load note:", loadError);
+    } finally {
+      setLoading(false);
+    }
+  };
+
+  useEffect(() => {
+    fetchNote();
+  }, [id]);
+
+  // TRANSCRIBING 상태면 3초 폴링
+  useEffect(() => {
+    if (!note || note.NOTE_TYPE !== "TRANSCRIBING") return;
+    const interval = setInterval(fetchNote, 3000);
+    return () => clearInterval(interval);
+  }, [note?.NOTE_TYPE]);
+
+  /**
+   * Sends the edited title and content with PATCH, stores the response as the current
+   * note and leaves edit mode. On failure the error is logged and the user is alerted.
+   */
+  const handleSave = async () => {
+    setSaving(true);
+    try {
+      const patchRequest = {
+        method: "PATCH",
+        url: `/api/notes/${id}`,
+        data: { title: editTitle, content: editContent },
+      };
+      const saved = await request<NoteDetail>(patchRequest);
+      setNote(saved);
+      setEditing(false);
+    } catch (saveError) {
+      console.error("Failed to update note:", saveError);
+      alert("저장에 실패했습니다.");
+    } finally {
+      setSaving(false);
+    }
+  };
+
+  /**
+   * Deletes the note after the user confirms, then navigates back to the list.
+   * The deleting flag is only reset on failure, since success leaves this page.
+   */
+  const handleDelete = async () => {
+    const confirmed = confirm("정말 삭제하시겠습니까?");
+    if (!confirmed) {
+      return;
+    }
+    setDeleting(true);
+    try {
+      await request({ method: "DELETE", url: `/api/notes/${id}` });
+      router.push("/notes");
+    } catch (deleteError) {
+      console.error("Failed to delete note:", deleteError);
+      setDeleting(false);
+    }
+  };
+
+  if (loading) {
+    return (
+      <AuthGuard><NavBar />
+        <main className="max-w-4xl mx-auto px-4 py-8">
+          <p className="text-[var(--color-text-muted)]">Loading...</p>
+        </main>
+      </AuthGuard>
+    );
+  }
+
+  if (!note) {
+    return (
+      <AuthGuard><NavBar />
+        <main className="max-w-4xl mx-auto px-4 py-8">
+          <p className="text-red-400">노트를 찾을 수 없습니다.</p>
+          <button onClick={() => router.push("/notes")} className="mt-4 text-sm text-[var(--color-primary)] hover:underline">
+            &larr; Back to Notes
+          </button>
+        </main>
+      </AuthGuard>
+    );
+  }
+
+  return (
+    <AuthGuard>
+      <NavBar />
+      <main className="max-w-4xl mx-auto px-4 py-8">
+        <button
+          onClick={() => router.push("/notes")}
+          className="text-sm text-[var(--color-text-muted)] hover:text-[var(--color-primary)] mb-4 inline-block"
+        >
+          &larr; Back to Notes
+        </button>
+
+        {/* 헤더 */}
+        <div className="bg-[var(--color-bg-card)] rounded-xl p-6 border border-[var(--color-border)] mb-6">
+          <div className="flex items-center gap-2 mb-3">
+            <span className={`text-xs px-2 py-0.5 rounded ${
+              note.NOTE_TYPE === "TRANSCRIBING" ? "bg-yellow-500/20 text-yellow-400" :
+              note.NOTE_TYPE === "AUDIO_FAILED" ? "bg-red-500/20 text-red-400" :
+              note.NOTE_TYPE === "AUDIO" ? "bg-purple-500/20 text-purple-400" : "bg-blue-500/20 text-blue-400"
+            }`}>
+              {note.NOTE_TYPE === "TRANSCRIBING" ? "변환 중..." :
+               note.NOTE_TYPE === "AUDIO_FAILED" ? "변환 실패" :
+               note.NOTE_TYPE === "AUDIO" ? "음성" : "텍스트"}
+            </span>
+            {note.CATEGORY_PATH && (
+              <span className="text-xs px-1.5 py-0.5 rounded bg-[var(--color-primary)]/10 text-[var(--color-primary)]">
+                {note.CATEGORY_PATH}
+              </span>
+            )}
+          </div>
+
+          {editing ? (
+            <input
+              type="text"
+              value={editTitle}
+              onChange={(e) => setEditTitle(e.target.value)}
+              className="w-full px-3 py-1 rounded-lg bg-[var(--color-bg-hover)] border border-[var(--color-border)] focus:border-[var(--color-primary)] focus:outline-none text-xl font-bold mb-2"
+            />
+          ) : (
+            <h1 className="text-xl font-bold mb-2">{note.TITLE || "제목 없음"}</h1>
+          )}
+
+          <div className="flex gap-4 text-xs text-[var(--color-text-muted)]">
+            <span>생성: {new Date(note.CREATED_AT).toLocaleString("ko-KR")}</span>
+            <span>수정: {new Date(note.UPDATED_AT).toLocaleString("ko-KR")}</span>
+          </div>
+        </div>
+
+        {/* 변환 중 인디케이터 */}
+        {note.NOTE_TYPE === "TRANSCRIBING" && (
+          <div className="bg-yellow-500/10 border border-yellow-500/30 rounded-xl p-4 mb-6 flex items-center gap-3">
+            <div className="w-4 h-4 border-2 border-yellow-400 border-t-transparent rounded-full animate-spin" />
+            <span className="text-sm text-yellow-400">음성 변환 중입니다. 이 페이지에서 실시간으로 진행 상태를 확인할 수 있습니다.</span>
+          </div>
+        )}
+
+        {/* 내용 */}
+        <div className="bg-[var(--color-bg-card)] rounded-xl p-6 border border-[var(--color-border)] mb-6">
+          {editing ? (
+            <textarea
+              value={editContent}
+              onChange={(e) => setEditContent(e.target.value)}
+              rows={20}
+              className="w-full px-3 py-2 rounded-lg bg-[var(--color-bg-hover)] border border-[var(--color-border)] focus:border-[var(--color-primary)] focus:outline-none resize-y font-mono text-sm"
+            />
+          ) : (
+            <div className="text-sm leading-relaxed">
+              <ReactMarkdown
+                components={{
+                  h1: ({children}) => <h1 className="text-xl font-bold mt-6 mb-3">{children}</h1>,
+                  h2: ({children}) => <h2 className="text-lg font-bold mt-5 mb-2">{children}</h2>,
+                  h3: ({children}) => <h3 className="text-base font-bold mt-4 mb-2">{children}</h3>,
+                  p: ({children, node}) => {
+                    // eslint-disable-next-line @typescript-eslint/no-explicit-any
+                    const txt = node?.children?.map((c: any) => c.type === 'text' ? c.value : '').join('') || '';
+                    return <p className="mb-3"><SpeakableText text={txt}>{children}</SpeakableText></p>;
+                  },
+                  ul: ({children}) => <ul className="list-disc ml-5 mb-3 space-y-1">{children}</ul>,
+                  ol: ({children}) => <ol className="list-decimal ml-5 mb-3 space-y-1">{children}</ol>,
+                  li: ({children, node}) => {
+                    // eslint-disable-next-line @typescript-eslint/no-explicit-any
+                    const txt = node?.children?.map((c: any) => c.type === 'text' ? c.value : '').join('') || '';
+                    return <li className="leading-relaxed"><SpeakableText text={txt}>{children}</SpeakableText></li>;
+                  },
+                  strong: ({children}) => <strong className="font-bold">{children}</strong>,
+                  blockquote: ({children}) => <blockquote className="border-l-2 border-[var(--color-primary)] pl-4 my-3 italic text-[var(--color-text-muted)]">{children}</blockquote>,
+                }}
+              >
+                {note.CONTENT || "내용 없음"}
+              </ReactMarkdown>
+            </div>
+          )}
+        </div>
+
+        {/* 원본 텍스트 (STT raw) */}
+        {note.RAW_CONTENT && (
+          <div className="mb-6">
+            <button
+              onClick={() => setShowRaw(!showRaw)}
+              className="text-sm text-[var(--color-text-muted)] hover:text-[var(--color-primary)] mb-2"
+            >
+              {showRaw ? "▼ 원본 텍스트 숨기기" : "▶ STT 원본 텍스트 보기"}
+            </button>
+            {showRaw && (
+              <div className="bg-[var(--color-bg-card)] rounded-xl p-6 border border-[var(--color-border)] opacity-70">
+                <p className="text-xs text-[var(--color-text-muted)] mb-2">음성 인식 원본 (교정 전)</p>
+                <p className="text-sm whitespace-pre-wrap">{note.RAW_CONTENT}</p>
+              </div>
+            )}
+          </div>
+        )}
+
+        {/* 액션 */}
+        <div className="flex items-center gap-4">
+          {editing ? (
+            <>
+              <button
+                onClick={handleSave}
+                disabled={saving}
+                className="px-4 py-2 text-sm bg-[var(--color-primary)] rounded-lg disabled:opacity-40"
+              >
+                {saving ? "저장 중..." : "저장"}
+              </button>
+              <button
+                onClick={() => { setEditing(false); setEditTitle(note.TITLE || ""); setEditContent(note.CONTENT || ""); }}
+                className="px-4 py-2 text-sm bg-[var(--color-bg-hover)] border border-[var(--color-border)] rounded-lg"
+              >
+                취소
+              </button>
+            </>
+          ) : (
+            <>
+              <button
+                onClick={() => setEditing(true)}
+                className="text-sm text-[var(--color-primary)] hover:underline"
+              >
+                편집
+              </button>
+              <button
+                onClick={async () => {
+                  setPolishing(true);
+                  try {
+                    await request({ method: "POST", url: `/api/notes/${id}/polish` });
+                    await fetchNote();
+                  } catch (err) {
+                    console.error("Failed to polish:", err);
+                    alert("교정/요약에 실패했습니다.");
+                  } finally {
+                    setPolishing(false);
+                  }
+                }}
+                disabled={polishing || note.NOTE_TYPE === "TRANSCRIBING"}
+                className="text-sm text-[var(--color-primary)] hover:underline disabled:opacity-40"
+              >
+                {polishing ? "처리 중..." : "교정/요약"}
+              </button>
+            </>
+          )}
+          <button
+            onClick={handleDelete}
+            disabled={deleting}
+            className="text-sm text-red-400 hover:text-red-300 disabled:opacity-40"
+          >
+            {deleting ? "삭제 중..." : "삭제"}
+          </button>
+        </div>
+      </main>
+    </AuthGuard>
+  );
+}
--- a/sundol-frontend/src/app/notes/new/page.tsx
+++ b/sundol-frontend/src/app/notes/new/page.tsx
@@ -0,0 +1,166 @@
+"use client";
+
+import { useState, useRef, Suspense } from "react";
+import { useRouter, useSearchParams } from "next/navigation";
+import AuthGuard from "@/components/auth-guard";
+import NavBar from "@/components/nav-bar";
+import { useApi } from "@/lib/use-api";
+
+/**
+ * Page entry point: renders NewNotePage inside a Suspense boundary with a
+ * plain loading placeholder as the fallback.
+ */
+export default function NewNotePageWrapper() {
+  const loadingFallback = <div className="p-8 text-center">Loading...</div>;
+  return (
+    <Suspense fallback={loadingFallback}>
+      <NewNotePage />
+    </Suspense>
+  );
+}
+
+function NewNotePage() {
+  const { request } = useApi();
+  const router = useRouter();
+  const searchParams = useSearchParams();
+  const isAudio = searchParams.get("type") === "audio";
+
+  const [title, setTitle] = useState("");
+  const [content, setContent] = useState("");
+  const [saving, setSaving] = useState(false);
+  const [audioFile, setAudioFile] = useState<File | null>(null);
+  const [transcribing, setTranscribing] = useState(false);
+  const [transcription, setTranscription] = useState("");
+  const fileInputRef = useRef<HTMLInputElement>(null);
+
+  /**
+   * Creates a text note from the title/content fields and returns to the list.
+   * Does nothing when both fields are blank; on failure logs and alerts the user.
+   */
+  const handleSaveText = async () => {
+    const nothingToSave = [title, content].every((field) => !field.trim());
+    if (nothingToSave) {
+      return;
+    }
+    setSaving(true);
+    try {
+      await request({ method: "POST", url: "/api/notes", data: { title, content } });
+      router.push("/notes");
+    } catch (saveError) {
+      console.error("Failed to save note:", saveError);
+      alert("노트 저장에 실패했습니다.");
+    } finally {
+      setSaving(false);
+    }
+  };
+
+  /**
+   * Uploads the selected audio file (plus the title, when one was entered) as multipart
+   * form data, stores the returned transcription and opens the created note.
+   * Does nothing when no file is selected; on failure logs and alerts the user.
+   */
+  const handleUploadAudio = async () => {
+    if (!audioFile) {
+      return;
+    }
+    setTranscribing(true);
+    try {
+      const uploadBody = new FormData();
+      uploadBody.append("file", audioFile);
+      const hasTitle = Boolean(title.trim());
+      if (hasTitle) {
+        uploadBody.append("title", title);
+      }
+
+      const uploaded = await request<{ id: string; transcription: string }>({
+        method: "POST",
+        url: "/api/notes/audio",
+        data: uploadBody,
+        headers: { "Content-Type": "multipart/form-data" },
+      });
+      setTranscription(uploaded.transcription);
+      const detailUrl = `/notes/${uploaded.id}`;
+      router.push(detailUrl);
+    } catch (uploadError) {
+      console.error("Failed to transcribe audio:", uploadError);
+      alert("음성 변환에 실패했습니다.");
+    } finally {
+      setTranscribing(false);
+    }
+  };
+
+  return (
+    <AuthGuard>
+      <NavBar />
+      <main className="max-w-4xl mx-auto px-4 py-8">
+        <button
+          onClick={() => router.push("/notes")}
+          className="text-sm text-[var(--color-text-muted)] hover:text-[var(--color-primary)] mb-4 inline-block"
+        >
+          &larr; Back to Notes
+        </button>
+
+        <h1 className="text-2xl font-bold mb-6">
+          {isAudio ? "음성 노트 작성" : "텍스트 노트 작성"}
+        </h1>
+
+        <div className="bg-[var(--color-bg-card)] rounded-xl p-6 border border-[var(--color-border)] space-y-4">
+          {/* 제목 */}
+          <div>
+            <label className="block text-sm text-[var(--color-text-muted)] mb-1">제목</label>
+            <input
+              type="text"
+              value={title}
+              onChange={(e) => setTitle(e.target.value)}
+              placeholder={isAudio ? "자동 생성됩니다 (선택)" : "노트 제목"}
+              className="w-full px-3 py-2 rounded-lg bg-[var(--color-bg-hover)] border border-[var(--color-border)] focus:border-[var(--color-primary)] focus:outline-none"
+            />
+          </div>
+
+          {isAudio ? (
+            /* 음성 업로드 */
+            <div>
+              <label className="block text-sm text-[var(--color-text-muted)] mb-1">음성 파일</label>
+              <input
+                ref={fileInputRef}
+                type="file"
+                accept="audio/*"
+                onChange={(e) => setAudioFile(e.target.files?.[0] || null)}
+                className="hidden"
+              />
+              <div
+                onClick={() => fileInputRef.current?.click()}
+                className="border-2 border-dashed border-[var(--color-border)] rounded-lg p-8 text-center cursor-pointer hover:border-[var(--color-primary)] transition-colors"
+              >
+                {audioFile ? (
+                  <div>
+                    <p className="font-medium">{audioFile.name}</p>
+                    <p className="text-sm text-[var(--color-text-muted)] mt-1">
+                      {(audioFile.size / 1024 / 1024).toFixed(1)} MB
+                    </p>
+                  </div>
+                ) : (
+                  <div>
+                    <p className="text-[var(--color-text-muted)]">클릭하여 음성 파일을 선택하세요</p>
+                    <p className="text-xs text-[var(--color-text-muted)] mt-1">MP3, WAV, M4A, OGG, WebM</p>
+                  </div>
+                )}
+              </div>
+
+              {transcription && (
+                <div className="mt-4 p-4 bg-[var(--color-bg-hover)] rounded-lg">
+                  <p className="text-sm text-[var(--color-text-muted)] mb-2">변환 결과:</p>
+                  <p className="text-sm whitespace-pre-wrap">{transcription}</p>
+                </div>
+              )}
+
+              <button
+                onClick={handleUploadAudio}
+                disabled={!audioFile || transcribing}
+                className="mt-4 px-6 py-2 bg-[var(--color-primary)] hover:bg-[var(--color-primary-hover)] rounded-lg transition-colors disabled:opacity-40"
+              >
+                {transcribing ? "변환 중..." : "음성 변환 및 저장"}
+              </button>
+            </div>
+          ) : (
+            /* 텍스트 입력 */
+            <div>
+              <label className="block text-sm text-[var(--color-text-muted)] mb-1">내용 (Markdown)</label>
+              <textarea
+                value={content}
+                onChange={(e) => setContent(e.target.value)}
+                placeholder="노트 내용을 입력하세요..."
+                rows={15}
+                className="w-full px-3 py-2 rounded-lg bg-[var(--color-bg-hover)] border border-[var(--color-border)] focus:border-[var(--color-primary)] focus:outline-none resize-y font-mono text-sm"
+              />
+              <button
+                onClick={handleSaveText}
+                disabled={saving || (!title.trim() && !content.trim())}
+                className="mt-4 px-6 py-2 bg-[var(--color-primary)] hover:bg-[var(--color-primary-hover)] rounded-lg transition-colors disabled:opacity-40"
+              >
+                {saving ? "저장 중..." : "저장"}
+              </button>
+            </div>
+          )}
+        </div>
+      </main>
+    </AuthGuard>
+  );
+}
--- a/sundol-frontend/src/app/notes/page.tsx
+++ b/sundol-frontend/src/app/notes/page.tsx
@@ -0,0 +1,104 @@
+"use client";
+
+import { useEffect, useState } from "react";
+import Link from "next/link";
+import AuthGuard from "@/components/auth-guard";
+import NavBar from "@/components/nav-bar";
+import { useApi } from "@/lib/use-api";
+
+interface Note {
+  ID: string;
+  TITLE: string;
+  NOTE_TYPE: string;
+  CATEGORY_PATH: string | null;
+  CREATED_AT: string;
+  UPDATED_AT: string;
+}
+
+export default function NotesPage() {
+  const { request } = useApi();
+  const [notes, setNotes] = useState<Note[]>([]);
+  const [loading, setLoading] = useState(true);
+
+  useEffect(() => {
+    (async () => {
+      try {
+        const data = await request<Note[]>({ method: "GET", url: "/api/notes" });
+        setNotes(data);
+      } catch (err) {
+        console.error("Failed to load notes:", err);
+      } finally {
+        setLoading(false);
+      }
+    })();
+  }, []);
+
+  return (
+    <AuthGuard>
+      <NavBar />
+      <main className="max-w-4xl mx-auto px-4 py-8">
+        <div className="flex justify-between items-center mb-6">
+          <h1 className="text-2xl font-bold">Notes</h1>
+          <div className="flex gap-2">
+            <Link
+              href="/notes/new"
+              className="px-4 py-2 bg-[var(--color-primary)] hover:bg-[var(--color-primary-hover)] rounded-lg transition-colors text-sm"
+            >
+              + 텍스트 노트
+            </Link>
+            <Link
+              href="/notes/new?type=audio"
+              className="px-4 py-2 bg-[var(--color-bg-card)] border border-[var(--color-border)] hover:border-[var(--color-primary)] rounded-lg transition-colors text-sm"
+            >
+              + 음성 노트
+            </Link>
+          </div>
+        </div>
+
+        {loading ? (
+          <p className="text-[var(--color-text-muted)]">Loading...</p>
+        ) : notes.length === 0 ? (
+          <div className="bg-[var(--color-bg-card)] rounded-xl p-6 border border-[var(--color-border)]">
+            <p className="text-[var(--color-text-muted)]">아직 노트가 없습니다. 첫 노트를 작성해보세요.</p>
+          </div>
+        ) : (
+          <div className="space-y-3">
+            {notes.map((note) => (
+              <Link
+                key={note.ID}
+                href={`/notes/${note.ID}`}
+                className="block bg-[var(--color-bg-card)] rounded-xl p-4 border border-[var(--color-border)] hover:border-[var(--color-primary)] transition-colors"
+              >
+                <div className="flex items-center justify-between">
+                  <div className="flex-1 min-w-0">
+                    <div className="flex items-center gap-2 mb-1">
+                      <span className={`text-xs px-2 py-0.5 rounded ${
+                        note.NOTE_TYPE === "TRANSCRIBING" ? "bg-yellow-500/20 text-yellow-400" :
+                        note.NOTE_TYPE === "AUDIO_FAILED" ? "bg-red-500/20 text-red-400" :
+                        note.NOTE_TYPE === "AUDIO" ? "bg-purple-500/20 text-purple-400" :
+                        "bg-blue-500/20 text-blue-400"
+                      }`}>
+                        {note.NOTE_TYPE === "TRANSCRIBING" ? "변환 중..." :
+                         note.NOTE_TYPE === "AUDIO_FAILED" ? "변환 실패" :
+                         note.NOTE_TYPE === "AUDIO" ? "음성" : "텍스트"}
+                      </span>
+                      {note.CATEGORY_PATH && (
+                        <span className="text-xs px-1.5 py-0.5 rounded bg-[var(--color-primary)]/10 text-[var(--color-primary)]">
+                          {note.CATEGORY_PATH}
+                        </span>
+                      )}
+                    </div>
+                    <h3 className="font-medium truncate">{note.TITLE || "제목 없음"}</h3>
+                  </div>
+                  <span className="text-sm text-[var(--color-text-muted)] ml-4 whitespace-nowrap">
+                    {new Date(note.CREATED_AT).toLocaleDateString()}
+                  </span>
+                </div>
+              </Link>
+            ))}
+          </div>
+        )}
+      </main>
+    </AuthGuard>
+  );
+}
--- a/sundol-frontend/src/app/tts/page.tsx
+++ b/sundol-frontend/src/app/tts/page.tsx
@@ -0,0 +1,317 @@
+"use client";
+
+import { useState, useRef, useEffect } from "react";
+import AuthGuard from "@/components/auth-guard";
+import NavBar from "@/components/nav-bar";
+
+interface VoiceProfile {
+  id: string;
+  name: string;
+  ref_text?: string;
+}
+
+export default function TTSPage() {
+  // Recording
+  const [isRecording, setIsRecording] = useState(false);
+  const [recordedBlob, setRecordedBlob] = useState<Blob | null>(null);
+  const [recordedUrl, setRecordedUrl] = useState<string | null>(null);
+  const [uploadedFile, setUploadedFile] = useState<File | null>(null);
+  const mediaRecorderRef = useRef<MediaRecorder | null>(null);
+  const chunksRef = useRef<Blob[]>([]);
+
+  // Voice profiles
+  const [profiles, setProfiles] = useState<VoiceProfile[]>([]);
+  const [selectedProfile, setSelectedProfile] = useState<string>("");
+  const [profileName, setProfileName] = useState("");
+  const [refText, setRefText] = useState("");
+  const [registering, setRegistering] = useState(false);
+
+  // Speech generation
+  const [text, setText] = useState("");
+  const [language, setLanguage] = useState("korean");
+  const [generating, setGenerating] = useState(false);
+  const [outputUrl, setOutputUrl] = useState<string | null>(null);
+  const [error, setError] = useState<string | null>(null);
+  const [serverStatus, setServerStatus] = useState("checking...");
+
+  // Active tab
+  const [tab, setTab] = useState<"generate" | "register">("generate");
+
+  useEffect(() => {
+    fetch("/api/tts/health").then(r => r.json())
+      .then(d => setServerStatus(d.model_loaded ? "ready" : "loading..."))
+      .catch(() => setServerStatus("offline"));
+    fetchProfiles();
+  }, []);
+
+  // Loads voice profiles: applies the localStorage copy first, then the list returned by the server.
+  const fetchProfiles = () => {
+    const applyProfiles = (list: VoiceProfile[]) => {
+      setProfiles(list);
+      if (list.length > 0) setSelectedProfile(prev => prev || list[0].id); // updater avoids the stale closure value
+    };
+    try {
+      const cached = JSON.parse(localStorage.getItem("tts_profiles") || "null");
+      if (Array.isArray(cached)) applyProfiles(cached);
+    } catch { /* unreadable cache entry: ignored, the server request below still runs */ }
+    fetch("/api/tts/profiles").then(r => r.json())
+      .then(data => {
+        if (!Array.isArray(data)) return; // e.g. an error object; keep the current list
+        applyProfiles(data);
+        localStorage.setItem("tts_profiles", JSON.stringify(data));
+      }).catch(() => {});
+  };
+
+  const startRecording = async () => {
+    let stream: MediaStream | null = null;
+    try {
+      stream = await navigator.mediaDevices.getUserMedia({ audio: true });
+      const mr = new MediaRecorder(stream, { mimeType: "audio/webm" });
+      mediaRecorderRef.current = mr;
+      chunksRef.current = [];
+      mr.ondataavailable = (e) => { if (e.data.size > 0) chunksRef.current.push(e.data); };
+      mr.onstop = () => {
+        const blob = new Blob(chunksRef.current, { type: "audio/webm" });
+        setRecordedBlob(blob);
+        setRecordedUrl(URL.createObjectURL(blob));
+        setUploadedFile(null);
+        stream?.getTracks().forEach(t => t.stop());
+      };
+      mr.start();
+      setIsRecording(true);
+    } catch {
+      stream?.getTracks().forEach(t => t.stop()); // recorder setup can fail after permission was granted; release the mic
+      setError("마이크 접근 실패");
+    }
+  };
+
+  const stopRecording = () => { mediaRecorderRef.current?.stop(); setIsRecording(false); };
+
+  const handleFileUpload = (e: React.ChangeEvent<HTMLInputElement>) => {
+    const file = e.target.files?.[0];
+    if (file) { setUploadedFile(file); setRecordedBlob(null); setRecordedUrl(URL.createObjectURL(file)); }
+  };
+
+  // Registers a voice profile from the uploaded file or the microphone recording.
+  const handleRegister = async () => {
+    const audio = uploadedFile || recordedBlob;
+    if (!audio || !profileName.trim()) return;
+    setRegistering(true);
+    setError(null);
+    try {
+      const fd = new FormData();
+      fd.append("name", profileName);
+      fd.append("ref_audio", audio, uploadedFile?.name || "recording.webm");
+      if (refText.trim()) fd.append("ref_text", refText);
+      const res = await fetch("/api/tts/profiles", { method: "POST", body: fd });
+      if (!res.ok) throw new Error(await res.text());
+      const result = await res.json();
+      setProfileName("");
+      setRefText("");
+      setRecordedBlob(null);
+      setRecordedUrl(null);
+      setUploadedFile(null);
+      localStorage.removeItem("tts_profiles"); // invalidate first so fetchProfiles does not re-apply the stale list
+      fetchProfiles();
+      setSelectedProfile(result.id);
+      setTab("generate");
+    } catch (err) {
+      setError("프로필 등록 실패: " + (err instanceof Error ? err.message : ""));
+    } finally {
+      setRegistering(false);
+    }
+  };
+
+  // Deletes a profile after confirmation, then reloads the list; failures go to the error banner.
+  const handleDeleteProfile = async (id: string) => {
+    if (!confirm("삭제하시겠습니까?")) return;
+    try {
+      const res = await fetch(`/api/tts/profiles/${encodeURIComponent(id)}`, { method: "DELETE" });
+      if (!res.ok) throw new Error(`HTTP ${res.status}`);
+      localStorage.removeItem("tts_profiles"); // the cached list still contains the deleted profile
+      if (selectedProfile === id) setSelectedProfile("");
+      fetchProfiles();
+    } catch (err) {
+      setError("프로필 삭제 실패: " + (err instanceof Error ? err.message : ""));
+    }
+  };
+
+  // Generates speech for the entered text with the selected profile.
+  const handleGenerate = async () => {
+    if (!text.trim() || !selectedProfile) return;
+    setGenerating(true);
+    setError(null);
+    if (outputUrl) URL.revokeObjectURL(outputUrl); // release the previous result's blob
+    setOutputUrl(null);
+    try {
+      const fd = new FormData();
+      fd.append("text", text);
+      fd.append("profile_id", selectedProfile);
+      fd.append("language", language);
+      const res = await fetch("/api/tts/speak", { method: "POST", body: fd });
+      if (!res.ok) throw new Error(`HTTP ${res.status}`);
+      const blob = await res.blob();
+      if (blob.size < 100) throw new Error("Empty audio");
+      setOutputUrl(URL.createObjectURL(blob));
+    } catch (err) {
+      setError("생성 실패: " + (err instanceof Error ? err.message : ""));
+    } finally {
+      setGenerating(false);
+    }
+  };
+
+  return (
+    <AuthGuard>
+      <NavBar />
+      <main className="max-w-4xl mx-auto px-4 py-8">
+        <div className="flex justify-between items-center mb-6">
+          <h1 className="text-2xl font-bold">Voice Clone (TTS)</h1>
+          <span className={`text-xs px-2 py-1 rounded ${
+            serverStatus === "ready" ? "bg-green-500/20 text-green-400" :
+            serverStatus === "offline" ? "bg-red-500/20 text-red-400" :
+            "bg-yellow-500/20 text-yellow-400"
+          }`}>{serverStatus}</span>
+        </div>
+
+        {/* Tabs */}
+        <div className="flex gap-2 mb-6">
+          <button onClick={() => setTab("generate")}
+            className={`px-4 py-2 text-sm rounded-lg ${tab === "generate" ? "bg-[var(--color-primary)] text-white" : "bg-[var(--color-bg-card)] border border-[var(--color-border)]"}`}>
+            음성 생성
+          </button>
+          <button onClick={() => setTab("register")}
+            className={`px-4 py-2 text-sm rounded-lg ${tab === "register" ? "bg-[var(--color-primary)] text-white" : "bg-[var(--color-bg-card)] border border-[var(--color-border)]"}`}>
+            음성 프로필 등록
+          </button>
+        </div>
+        {/* Error banner shared by both tabs (recording, registration, deletion, generation) */}
+        {error && (
+          <div className="bg-red-500/10 border border-red-500/30 rounded-xl p-4 text-sm text-red-400 mb-6">{error}</div>
+        )}
+
+        {tab === "register" ? (
+          /* Profile registration */
+          <div className="space-y-6">
+            <div className="bg-[var(--color-bg-card)] rounded-xl p-6 border border-[var(--color-border)]">
+              <h2 className="text-lg font-semibold mb-4">음성 프로필 등록</h2>
+              <p className="text-sm text-[var(--color-text-muted)] mb-4">
+                15~30초 분량의 깨끗한 음성을 녹음하거나 파일을 업로드하세요.
+              </p>
+              <div className="space-y-4">
+                <div>
+                  <label className="block text-sm text-[var(--color-text-muted)] mb-1">프로필 이름</label>
+                  <input type="text" value={profileName} onChange={e => setProfileName(e.target.value)}
+                    placeholder="예: 내 목소리"
+                    className="w-full px-3 py-2 rounded-lg bg-[var(--color-bg-hover)] border border-[var(--color-border)] focus:border-[var(--color-primary)] focus:outline-none text-sm" />
+                </div>
+                <div className="flex gap-3">
+                  {isRecording ? (
+                    <button onClick={stopRecording}
+                      className="px-4 py-2 bg-red-500 hover:bg-red-600 rounded-lg text-sm flex items-center gap-2">
+                      <span className="w-3 h-3 bg-white rounded-full animate-pulse" /> 녹음 중지
+                    </button>
+                  ) : (
+                    <button onClick={startRecording}
+                      className="px-4 py-2 bg-[var(--color-primary)] hover:bg-[var(--color-primary-hover)] rounded-lg text-sm">
+                      마이크 녹음
+                    </button>
+                  )}
+                  <label className="px-4 py-2 bg-[var(--color-bg-hover)] border border-[var(--color-border)] rounded-lg text-sm cursor-pointer hover:border-[var(--color-primary)]">
+                    파일 업로드
+                    <input type="file" accept="audio/*" onChange={handleFileUpload} className="hidden" />
+                  </label>
+                </div>
+                {recordedUrl && (
+                  <audio controls src={recordedUrl} className="w-full" />
+                )}
+                <div>
+                  <label className="block text-sm text-[var(--color-text-muted)] mb-1">참조 텍스트 (선택 - 정확도 향상)</label>
+                  <input type="text" value={refText} onChange={e => setRefText(e.target.value)}
+                    placeholder="녹음에서 말한 내용"
+                    className="w-full px-3 py-2 rounded-lg bg-[var(--color-bg-hover)] border border-[var(--color-border)] focus:border-[var(--color-primary)] focus:outline-none text-sm" />
+                </div>
+                <button onClick={handleRegister}
+                  disabled={registering || !profileName.trim() || !(uploadedFile || recordedBlob)}
+                  className="px-6 py-2 bg-[var(--color-primary)] hover:bg-[var(--color-primary-hover)] rounded-lg disabled:opacity-40">
+                  {registering ? "등록 중..." : "프로필 등록"}
+                </button>
+              </div>
+            </div>
+            {/* Registered profiles */}
+            {profiles.length > 0 && (
+              <div className="bg-[var(--color-bg-card)] rounded-xl p-6 border border-[var(--color-border)]">
+                <h2 className="text-lg font-semibold mb-4">등록된 프로필</h2>
+                <div className="space-y-2">
+                  {profiles.map(p => (
+                    <div key={p.id} className="flex items-center justify-between p-3 bg-[var(--color-bg-hover)] rounded-lg">
+                      <span className="text-sm font-medium">{p.name}</span>
+                      <button onClick={() => handleDeleteProfile(p.id)}
+                        className="text-xs text-red-400 hover:text-red-300">삭제</button>
+                    </div>
+                  ))}
+                </div>
+              </div>
+            )}
+          </div>
+        ) : (
+          /* Speech generation */
+          <div className="space-y-6">
+            {/* Profile selection */}
+            <div className="bg-[var(--color-bg-card)] rounded-xl p-6 border border-[var(--color-border)]">
+              <h2 className="text-lg font-semibold mb-4">1. 음성 프로필 선택</h2>
+              {profiles.length === 0 ? (
+                <p className="text-sm text-[var(--color-text-muted)]">
+                  등록된 프로필이 없습니다.{" "}
+                  <button onClick={() => setTab("register")} className="text-[var(--color-primary)] hover:underline">
+                    프로필 등록하기
+                  </button>
+                </p>
+              ) : (
+                <div className="flex flex-wrap gap-2">
+                  {profiles.map(p => (
+                    <button key={p.id} onClick={() => setSelectedProfile(p.id)}
+                      className={`px-4 py-2 text-sm rounded-lg transition-colors ${
+                        selectedProfile === p.id
+                          ? "bg-[var(--color-primary)] text-white"
+                          : "bg-[var(--color-bg-hover)] border border-[var(--color-border)] hover:border-[var(--color-primary)]"
+                      }`}>
+                      {p.name}
+                    </button>
+                  ))}
+                </div>
+              )}
+            </div>
+            {/* Text input */}
+            <div className="bg-[var(--color-bg-card)] rounded-xl p-6 border border-[var(--color-border)]">
+              <h2 className="text-lg font-semibold mb-4">2. 읽을 텍스트</h2>
+              <select value={language} onChange={e => setLanguage(e.target.value)}
+                className="px-3 py-2 rounded-lg bg-[var(--color-bg-hover)] border border-[var(--color-border)] text-sm mb-3">
+                <option value="korean">한국어</option>
+                <option value="english">English</option>
+                <option value="japanese">日本語</option>
+                <option value="chinese">中文</option>
+              </select>
+              <textarea value={text} onChange={e => setText(e.target.value)}
+                placeholder="음성으로 변환할 텍스트를 입력하세요..." rows={5}
+                className="w-full px-3 py-2 rounded-lg bg-[var(--color-bg-hover)] border border-[var(--color-border)] focus:border-[var(--color-primary)] focus:outline-none text-sm resize-y" />
+            </div>
+            {/* Generate */}
+            <button onClick={handleGenerate}
+              disabled={generating || !text.trim() || !selectedProfile || serverStatus !== "ready"}
+              className="w-full py-3 bg-[var(--color-primary)] hover:bg-[var(--color-primary-hover)] rounded-xl text-lg font-semibold disabled:opacity-40">
+              {generating ? "생성 중..." : "음성 생성"}
+            </button>
+            {outputUrl && (
+              <div className="bg-[var(--color-bg-card)] rounded-xl p-6 border border-[var(--color-border)]">
+                <h2 className="text-lg font-semibold mb-4">생성 결과</h2>
+                <audio controls src={outputUrl} className="w-full mb-3" />
+                <a href={outputUrl} download="tts_output.wav"
+                  className="text-sm text-[var(--color-primary)] hover:underline">다운로드</a>
+              </div>
+            )}
+          </div>
+        )}
+      </main>
+    </AuthGuard>
+  );
+}
--- a/sundol-frontend/src/components/nav-bar.tsx
+++ b/sundol-frontend/src/components/nav-bar.tsx
@@ -7,10 +7,12 @@ import { useAuth } from "@/lib/auth-context";
 const navItems = [
  { href: "/dashboard", label: "Dashboard" },
  { href: "/knowledge", label: "Knowledge" },
+  { href: "/notes", label: "Notes" },
  { href: "/chat", label: "Chat" },
  { href: "/study", label: "Study" },
  { href: "/todos", label: "Todos" },
  { href: "/habits", label: "Habits" },
+  { href: "/tts", label: "TTS" },
  { href: "/settings", label: "Settings" },
 ];

--- a/sundol-frontend/src/components/speakable-text.tsx
+++ b/sundol-frontend/src/components/speakable-text.tsx
@@ -0,0 +1,85 @@
+"use client";
+
+import { useState, useRef, useEffect } from "react";
+
+interface SpeakableProps {
+  children: React.ReactNode;
+  text: string;
+}
+
+let cachedProfileId: string | null = null;
+let profileChecked = false;
+
+/** Renders children plus a speaker button that reads `text` aloud with the first cached voice profile. */
+export default function SpeakableText({ children, text }: SpeakableProps) {
+  const [playing, setPlaying] = useState(false);
+  const [loading, setLoading] = useState(false);
+  const [hasProfile, setHasProfile] = useState(false);
+  const audioRef = useRef<HTMLAudioElement | null>(null);
+
+  // Resolve the default profile from localStorage; the module-level cache is shared by every instance.
+  useEffect(() => {
+    if (profileChecked) { setHasProfile(!!cachedProfileId); return; }
+    try {
+      const profiles = JSON.parse(localStorage.getItem("tts_profiles") || "[]");
+      if (profiles.length > 0) {
+        cachedProfileId = profiles[0].id;
+        profileChecked = true; // latch only on success so a profile registered later is still picked up
+        setHasProfile(true);
+      }
+    } catch { /* unreadable cache entry: behave as if no profile exists */ }
+  }, []);
+
+  // Toggles playback: stops the current clip, or synthesizes `text` via /api/tts/speak and plays it.
+  const handleSpeak = async (e: React.MouseEvent) => {
+    e.preventDefault();
+    e.stopPropagation();
+    if (playing) {
+      if (audioRef.current) { audioRef.current.pause(); URL.revokeObjectURL(audioRef.current.src); }
+      setPlaying(false);
+      return;
+    }
+    if (!cachedProfileId || text.length < 5) return;
+
+    setLoading(true);
+    let url = "";
+    const release = () => { if (url) URL.revokeObjectURL(url); setPlaying(false); };
+    try {
+      const fd = new FormData();
+      fd.append("text", text);
+      fd.append("profile_id", cachedProfileId);
+      fd.append("language", "Korean");
+      const res = await fetch("/api/tts/speak", { method: "POST", body: fd });
+      if (!res.ok) return;
+      const blob = await res.blob();
+      if (blob.size < 200) return;
+      url = URL.createObjectURL(blob);
+      const audio = new Audio(url);
+      audioRef.current = audio;
+      audio.onended = release;
+      await audio.play(); // rejects when playback cannot start; handled below instead of leaving `playing` stuck
+      setPlaying(true);
+    } catch {
+      release();
+    } finally {
+      setLoading(false);
+    }
+  };
+
+  if (!hasProfile || text.length < 5) return <>{children}</>;
+
+  return (
+    <>
+      {children}
+      <button
+        onClick={handleSpeak}
+        disabled={loading}
+        className="inline-flex items-center ml-1 text-[var(--color-text-muted)] hover:text-[var(--color-primary)] disabled:opacity-30 align-middle"
+        title={playing ? "중지" : "읽어주기"}
+        style={{ fontSize: "0.85em", verticalAlign: "middle", cursor: "pointer" }}
+      >
+        {loading ? "⏳" : playing ? "⏹" : "🔊"}
+      </button>
+    </>
+  );
+}
--- a/sundol-frontend/src/components/tts-reader.tsx
+++ b/sundol-frontend/src/components/tts-reader.tsx
@@ -0,0 +1,159 @@
+"use client";
+
+import { useState, useEffect, useRef } from "react";
+
+interface TTSReaderProps {
+  text: string;
+}
+
+interface VoiceProfile {
+  id: string;
+  name: string;
+}
+
+/** Reads `text` aloud line by line with a selectable voice profile; renders nothing until a profile exists. */
+export default function TTSReader({ text }: TTSReaderProps) {
+  const [profiles, setProfiles] = useState<VoiceProfile[]>([]);
+  const [selectedProfile, setSelectedProfile] = useState("");
+  const [generating, setGenerating] = useState(false);
+  const [playing, setPlaying] = useState(false);
+  const [progress, setProgress] = useState("");
+  const audioRef = useRef<HTMLAudioElement | null>(null);
+  const stoppedRef = useRef(false);
+  const audioUrlsRef = useRef<string[]>([]);
+
+  useEffect(() => {
+    // Seed from the localStorage cache so the control can render before the network answers.
+    try {
+      const cachedList = JSON.parse(localStorage.getItem("tts_profiles") || "[]");
+      if (Array.isArray(cachedList) && cachedList.length > 0) {
+        setProfiles(cachedList);
+        setSelectedProfile(cachedList[0].id);
+      }
+    } catch { /* unreadable cache entry: rely on the network refresh below */ }
+    // Refresh in the background; the updater keeps whatever profile is selected by then.
+    fetch("/api/tts/profiles").then(r => r.json()).then(data => {
+      if (!Array.isArray(data)) return;
+      setProfiles(data);
+      if (data.length > 0) setSelectedProfile(prev => prev || data[0].id);
+      localStorage.setItem("tts_profiles", JSON.stringify(data));
+    }).catch(() => {});
+    return () => { stoppedRef.current = true; audioRef.current?.pause(); audioUrlsRef.current.forEach(u => URL.revokeObjectURL(u)); };
+  }, []);
+
+  // Drops heading lines, strips bold/list/quote/rule/link markup, and keeps lines of at least 10 characters.
+  const toSentences = (md: string): string[] => md
+    .replace(/^#+\s+.*$/gm, "")
+    .replace(/\*\*/g, "")
+    .replace(/^[-*]\s+/gm, "")
+    .replace(/^>\s+/gm, "")
+    .replace(/---+/g, "")
+    .replace(/\[([^\]]+)\]\([^)]+\)/g, "$1")
+    .split("\n")
+    .map(s => s.trim())
+    .filter(s => s.length >= 10);
+
+  // Synthesizes one chunk; resolves to an object URL for the audio, or null for an error/too-small response.
+  const speak = async (chunk: string): Promise<string | null> => {
+    const fd = new FormData();
+    fd.append("text", chunk);
+    fd.append("profile_id", selectedProfile);
+    fd.append("language", "Korean");
+    const res = await fetch("/api/tts/speak", { method: "POST", body: fd });
+    if (!res.ok) return null;
+    const blob = await res.blob();
+    return blob.size > 100 ? URL.createObjectURL(blob) : null;
+  };
+
+  const handleGenerate = async () => {
+    if (!selectedProfile || !text.trim()) return;
+    setGenerating(true);
+    setPlaying(true);
+    stoppedRef.current = false;
+    audioUrlsRef.current.splice(0).forEach(u => URL.revokeObjectURL(u)); // drop the previous run's clips
+    const sentences = toSentences(text);
+    let playIdx = 0;
+    let isAudioPlaying = false, allGenerated = false;
+
+    // Plays queued clips back-to-back; goes idle when the queue runs dry so the loop below can restart it.
+    const playNext = () => {
+      if (stoppedRef.current) return;
+      if (playIdx >= audioUrlsRef.current.length) {
+        isAudioPlaying = false;
+        if (allGenerated) setPlaying(false); // final clip ended and nothing else is coming
+        return;
+      }
+      isAudioPlaying = true;
+      const a = new Audio(audioUrlsRef.current[playIdx++]);
+      audioRef.current = a;
+      a.onended = playNext;
+      a.play().catch(playNext); // a clip that cannot start is skipped instead of stalling the queue
+    };
+
+    for (let i = 0; i < sentences.length; i++) {
+      if (stoppedRef.current) break;
+      setProgress(`${i + 1}/${sentences.length}`);
+      const url = await speak(sentences[i]).catch(() => null); // a failed request must not leave the UI stuck
+      if (url && !stoppedRef.current) {
+        audioUrlsRef.current.push(url);
+        if (!isAudioPlaying) playNext();
+      }
+    }
+
+    allGenerated = true;
+    setGenerating(false);
+    setProgress("");
+    if (!isAudioPlaying) setPlaying(false);
+  };
+
+  const handleStop = () => {
+    stoppedRef.current = true;
+    audioRef.current?.pause();
+    setPlaying(false);
+    setGenerating(false);
+    setProgress("");
+  };
+
+  // Replays the clips kept from the last run without calling the server again.
+  const handleReplay = () => {
+    if (audioUrlsRef.current.length === 0) return;
+    stoppedRef.current = false;
+    setPlaying(true);
+    let idx = 0;
+    const play = () => {
+      if (idx >= audioUrlsRef.current.length || stoppedRef.current) { setPlaying(false); return; }
+      const audio = new Audio(audioUrlsRef.current[idx++]);
+      audioRef.current = audio;
+      audio.onended = play;
+      audio.play().catch(play);
+    };
+    play();
+  };
+
+  if (profiles.length === 0) return null;
+  return (
+    <div className="flex items-center gap-2 flex-wrap">
+      <select value={selectedProfile} onChange={e => setSelectedProfile(e.target.value)}
+        className="text-xs px-2 py-1 rounded bg-[var(--color-bg-hover)] border border-[var(--color-border)]">
+        {profiles.map(p => <option key={p.id} value={p.id}>{p.name}</option>)}
+      </select>
+      {playing || generating ? (
+        <button onClick={handleStop}
+          className="text-xs px-3 py-1 bg-red-500/20 text-red-400 rounded hover:bg-red-500/30">
+          {progress || "중지"}
+        </button>
+      ) : (
+        <button onClick={handleGenerate} disabled={!selectedProfile}
+          className="text-xs px-3 py-1 bg-[var(--color-primary)]/20 text-[var(--color-primary)] rounded hover:bg-[var(--color-primary)]/30 disabled:opacity-40">
+          읽어주기
+        </button>
+      )}
+      {audioUrlsRef.current.length > 0 && !playing && !generating && (
+        <button onClick={handleReplay}
+          className="text-xs px-3 py-1 bg-[var(--color-bg-hover)] border border-[var(--color-border)] rounded">
+          다시 재생
+        </button>
+      )}
+    </div>
+  );
+}
--- a/sundol-frontend/src/lib/api.ts
+++ b/sundol-frontend/src/lib/api.ts
@@ -5,7 +5,7 @@ export const api = axios.create({
  withCredentials: true,
 });

-// --- 공통 토큰 refresh 로직 (mutex 패턴) ---
+// --- refresh 로직 ---

 let isRefreshing = false;
 let pendingQueue: {
@@ -13,7 +13,6 @@ let pendingQueue: {
  reject: (error: unknown) => void;
 }[] = [];

-// auth-context에서 주입하는 콜백
 let onTokenRefreshed: ((token: string) => void) | null = null;
 let onRefreshFailed: (() => void) | null = null;

@@ -27,21 +26,27 @@ export function setAuthCallbacks(

 function processQueue(token: string | null, error: unknown) {
  pendingQueue.forEach(({ resolve, reject }) => {
-    if (token) {
-      resolve(token);
-    } else {
-      reject(error);
-    }
+    if (token) resolve(token);
+    else reject(error);
  });
  pendingQueue = [];
 }

+// Request interceptor: attach the latest access token from localStorage (browser only) to every request.
+api.interceptors.request.use((config) => {
+  const token = typeof window !== "undefined" ? localStorage.getItem("accessToken") : null;
+  if (token) {
+    config.headers["Authorization"] = `Bearer ${token}`;
+  }
+  return config;
+});
+
+// 응답 인터셉터: 401이면 refresh 후 재시도
 api.interceptors.response.use(
  (response) => response,
  async (error: AxiosError) => {
    const originalRequest = error.config as InternalAxiosRequestConfig & { _retry?: boolean };

-    // 401이 아니거나, refresh 요청 자체가 실패한 경우, 이미 retry한 경우 → 그냥 throw
    if (
      error.response?.status !== 401 ||
      originalRequest.url?.includes("/api/auth/") ||
@@ -50,7 +55,6 @@ api.interceptors.response.use(
      return Promise.reject(error);
    }

-    // 이미 refresh 진행 중이면 큐에 대기
    if (isRefreshing) {
      return new Promise((resolve, reject) => {
        pendingQueue.push({
@@ -64,36 +68,25 @@ api.interceptors.response.use(
      });
    }

-    // refresh 시작
    isRefreshing = true;
    originalRequest._retry = true;

-    const attemptRefresh = async (retryCount: number): Promise<string> => {
    try {
-        const res = await api.post<LoginResponse>("/api/auth/refresh");
-        return res.data.accessToken;
-      } catch (err) {
-        const isNetworkError = !((err as AxiosError).response);
-        if (isNetworkError && retryCount < 2) {
-          // 네트워크 에러(서버 재시작 등)면 3초 후 재시도
-          await new Promise((r) => setTimeout(r, 3000));
-          return attemptRefresh(retryCount + 1);
-        }
-        throw err;
-      }
-    };
+      const rt = localStorage.getItem("refreshToken");
+      if (!rt) throw new Error("No refresh token");

-    try {
-      const newToken = await attemptRefresh(0);
+      const res = await api.post<LoginResponse>("/api/auth/refresh", { refreshToken: rt });
+      const newAccess = res.data.accessToken;
+      const newRefresh = res.data.refreshToken;

-      api.defaults.headers.common["Authorization"] = `Bearer ${newToken}`;
-      onTokenRefreshed?.(newToken);
+      localStorage.setItem("accessToken", newAccess);
+      if (newRefresh) localStorage.setItem("refreshToken", newRefresh);
+      api.defaults.headers.common["Authorization"] = `Bearer ${newAccess}`;

-      // 대기 중인 요청들 처리
-      processQueue(newToken, null);
+      onTokenRefreshed?.(newAccess);
+      processQueue(newAccess, null);

-      // 원래 요청 retry
-      originalRequest.headers["Authorization"] = `Bearer ${newToken}`;
+      originalRequest.headers["Authorization"] = `Bearer ${newAccess}`;
      return api.request(originalRequest);
    } catch (refreshError) {
      processQueue(null, refreshError);
--- a/sundol-frontend/src/lib/auth-context.tsx
+++ b/sundol-frontend/src/lib/auth-context.tsx
@@ -1,6 +1,6 @@
 "use client";

-import React, { createContext, useContext, useState, useCallback, useEffect, useRef } from "react";
+import React, { createContext, useContext, useState, useCallback, useEffect } from "react";
 import { api, LoginResponse, setAuthCallbacks } from "./api";

 interface AuthContextType {
@@ -21,93 +21,60 @@ const AuthContext = createContext<AuthContextType>({
  setAccessToken: () => {},
 });

-export function AuthProvider({ children }: { children: React.ReactNode }) {
-  const [accessToken, setAccessTokenState] = useState<string | null>(null);
-  const [isLoading, setIsLoading] = useState(true);
-  const logoutRef = useRef<() => void>(() => {});
+function getStoredToken(): string | null {
+  if (typeof window === "undefined") return null;
+  return localStorage.getItem("accessToken");
+}

-  // localStorage와 동기화하는 setter
-  const setAccessToken = useCallback((token: string | null) => {
-    setAccessTokenState(token);
-    if (token) {
-      localStorage.setItem("accessToken", token);
-    } else {
+export function AuthProvider({ children }: { children: React.ReactNode }) {
+  const [accessToken, setAccessTokenState] = useState<string | null>(getStoredToken);
+  const [isLoading, setIsLoading] = useState(false);
+
+  const saveTokens = useCallback((access: string, refresh?: string) => {
+    setAccessTokenState(access);
+    localStorage.setItem("accessToken", access);
+    if (refresh) localStorage.setItem("refreshToken", refresh);
+    api.defaults.headers.common["Authorization"] = `Bearer ${access}`;
+  }, []);
+
+  const clearTokens = useCallback(() => {
+    setAccessTokenState(null);
    localStorage.removeItem("accessToken");
+    localStorage.removeItem("refreshToken");
+    delete api.defaults.headers.common["Authorization"];
+  }, []);
+
+  const login = useCallback((response: LoginResponse) => {
+    saveTokens(response.accessToken, response.refreshToken);
+  }, [saveTokens]);
+
+  const logout = useCallback(async () => {
+    try { await api.post("/api/auth/logout"); } catch {}
+    clearTokens();
+    window.location.href = "/login";
+  }, [clearTokens]);
+
+  // 인터셉터 콜백: 토큰 갱신 성공/실패 처리
+  useEffect(() => {
+    setAuthCallbacks(
+      (token: string) => {
+        setAccessTokenState(token);
+        localStorage.setItem("accessToken", token);
+      },
+      () => logout()
+    );
+  }, [logout]);
+
+  // 앱 로드 시 localStorage 토큰으로 헤더 설정
+  useEffect(() => {
+    const access = localStorage.getItem("accessToken");
+    if (access) {
+      api.defaults.headers.common["Authorization"] = `Bearer ${access}`;
    }
  }, []);

-  // interceptor 콜백 등록
-  useEffect(() => {
-    setAuthCallbacks(
-      (token: string) => setAccessToken(token),
-      () => logoutRef.current()
-    );
-  }, [setAccessToken]);
-
-  useEffect(() => {
-    const restoreSession = async () => {
-      // 1차: localStorage에서 복원
-      const stored = localStorage.getItem("accessToken");
-      if (stored) {
-        setAccessTokenState(stored);
-        api.defaults.headers.common["Authorization"] = `Bearer ${stored}`;
-        setIsLoading(false);
-        return;
-      }
-
-      // 2차: refresh token cookie로 복원
-      try {
-        const res = await api.post<LoginResponse>("/api/auth/refresh");
-        const token = res.data.accessToken;
-        setAccessToken(token);
-        api.defaults.headers.common["Authorization"] = `Bearer ${token}`;
-      } catch {
-        // No valid session
-      } finally {
-        setIsLoading(false);
-      }
-    };
-    restoreSession();
-  }, [setAccessToken]);
-
-  useEffect(() => {
-    if (accessToken) {
-      api.defaults.headers.common["Authorization"] = `Bearer ${accessToken}`;
-    } else {
-      delete api.defaults.headers.common["Authorization"];
-    }
-  }, [accessToken]);
-
-  const login = useCallback((response: LoginResponse) => {
-    setAccessToken(response.accessToken);
-  }, [setAccessToken]);
-
-  const logout = useCallback(async () => {
-    try {
-      await api.post("/api/auth/logout");
-    } catch {
-      // Ignore logout errors
-    }
-    setAccessToken(null);
-    window.location.href = "/login";
-  }, [setAccessToken]);
-
-  // ref로 최신 logout 유지 (interceptor에서 사용)
-  useEffect(() => {
-    logoutRef.current = logout;
-  }, [logout]);
-
  return (
-    <AuthContext.Provider
-      value={{
-        isAuthenticated: !!accessToken,
-        isLoading,
-        accessToken,
-        login,
-        logout,
-        setAccessToken,
-      }}
-    >
+    <AuthContext.Provider value={{ isAuthenticated: !!accessToken, isLoading, accessToken, login, logout, setAccessToken: (t) => saveTokens(t) }}>
      {children}
    </AuthContext.Provider>
  );
--- a/tts-server.py
+++ b/tts-server.py
@@ -0,0 +1,216 @@
+"""
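+Qwen3-TTS Voice Clone API Server (optimized version)
+- Uses the 1.7B model (MODEL_NAME below), with speed settings aimed at an A10 GPU
+- The model is loaded once; voice clone prompts are cached in memory
+- inference_mode, bf16 (fp16 when bf16 is not supported)
+- Synthesis is per sentence: /api/tts/speak handles one sentence per request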
+"""
+import os
+import io
+import json
+import pickle
+import re
+import tempfile
+import time
+import uuid
+import threading
+
+import numpy as np
+import soundfile as sf
+import torch
+from fastapi import FastAPI, UploadFile, File, Form
+from fastapi.responses import StreamingResponse, FileResponse
+from fastapi.middleware.cors import CORSMiddleware
+
+app = FastAPI()
+app.add_middleware(CORSMiddleware, allow_origins=["*"], allow_methods=["*"], allow_headers=["*"])  # CORS is open to every origin, method and header
+
+PROFILES_DIR = os.path.join(os.path.dirname(__file__), "voice-profiles")  # profile files live next to this script
+os.makedirs(PROFILES_DIR, exist_ok=True)
+
+MODEL_NAME = "Qwen/Qwen3-TTS-12Hz-1.7B-Base"
+model = None  # assigned by get_model() on first use
+prompt_cache = {}  # profile_id → voice_clone_prompt
+
+
+def get_model():  # Returns the shared TTS model, loading it (and the prompt cache) on the first call only.
+    global model
+    if model is None:
+        from qwen_tts import Qwen3TTSModel  # deferred import: only needed when the model is actually loaded
+        print(f"Loading {MODEL_NAME}...")
+        torch.set_grad_enabled(False)  # gradient tracking is not needed for synthesis
+        torch.backends.cuda.matmul.allow_tf32 = True
+        torch.backends.cudnn.allow_tf32 = True
+        dtype = torch.bfloat16 if torch.cuda.is_bf16_supported() else torch.float16  # prefer bf16, otherwise fp16
+        model = Qwen3TTSModel.from_pretrained(
+            MODEL_NAME, device_map="cuda:0", dtype=dtype,
+        )
+        # Fill the in-memory prompt cache from the saved profile pickles.
+        load_all_prompts()
+        print("Model loaded!")
+    return model
+
+
+def load_all_prompts():
+    """Load every saved voice clone prompt (*.pkl in PROFILES_DIR) into prompt_cache; failures are logged and skipped."""
+    global prompt_cache
+    for f in os.listdir(PROFILES_DIR):
+        if f.endswith(".pkl"):
+            pid = f[: -len(".pkl")]  # strip only the trailing extension; str.replace would also remove ".pkl" inside the id
+            try:
+                with open(os.path.join(PROFILES_DIR, f), "rb") as fh:
+                    prompt_cache[pid] = pickle.load(fh)  # NOTE(review): unpickling can run code; PROFILES_DIR must stay trusted
+                print(f"  Cached prompt: {pid}")
+            except Exception as e:
+                print(f"  Failed to cache {pid}: {e}")
+
+
+def get_prompt(profile_id: str):
+    """Return the voice clone prompt for profile_id from the cache, loading <profile_id>.pkl on a miss; None if that file is absent."""
+    if profile_id in prompt_cache:
+        return prompt_cache[profile_id]
+
+    pkl_path = os.path.join(PROFILES_DIR, f"{profile_id}.pkl")
+    if os.path.exists(pkl_path):
+        with open(pkl_path, "rb") as f:
+            prompt = pickle.load(f)
+        prompt_cache[profile_id] = prompt  # remember it so the next call skips the disk read
+        return prompt
+    return None
+
+
+# === API ===
+
+@app.get("/health")
+@app.get("/api/tts/health")
+def health():  # Status probe: reports the configured model name and whether the model has been loaded yet.
+    return dict(status="ok", model=MODEL_NAME, model_loaded=model is not None)
+
+
+@app.get("/api/tts/profiles")
+def list_profiles():
+    """Return the parsed metadata of every *.json file in PROFILES_DIR, in os.listdir order."""
+    collected = []
+    for file_name in filter(lambda n: n.endswith(".json"), os.listdir(PROFILES_DIR)):
+        with open(os.path.join(PROFILES_DIR, file_name)) as meta_file:
+            collected.append(json.load(meta_file))
+    return collected
+
+
+@app.post("/api/tts/profiles")
+async def create_profile(
+    name: str = Form(...),
+    ref_audio: UploadFile = File(...),
+    ref_text: str = Form(""),
+):
+    """Create (or overwrite) a voice profile from an uploaded reference clip.
+
+    Writes <id>.wav, <id>.pkl and <id>.json to PROFILES_DIR, where id is `name` lower-cased with spaces as "_".
+    An empty name or one containing a path separator gets HTTP 400, because the id is used as a file name.
+    """
+    import shutil
+    import subprocess
+    profile_id = name.replace(" ", "_").lower()
+    if not profile_id or os.path.basename(profile_id) != profile_id:
+        return JSONResponse(status_code=400, content={"error": "Invalid profile name"})
+    m = get_model()
+    with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmp:
+        tmp.write(await ref_audio.read())
+        tmp_path = tmp.name
+    try:
+        if not (ref_audio.filename or "").endswith(".wav"):  # filename can be absent on an upload
+            src_path, tmp_path = tmp_path, tmp_path + "_converted.wav"
+            try:  # argument list (no shell); check=True reports a failed conversion instead of ignoring it
+                subprocess.run(["ffmpeg", "-i", src_path, "-ar", "16000", "-ac", "1", "-y", tmp_path],
+                               stderr=subprocess.DEVNULL, check=True)
+            finally:
+                os.unlink(src_path)  # the raw upload is no longer needed, converted or not
+        kwargs = {"ref_audio": tmp_path}
+        if ref_text and ref_text.strip():
+            kwargs["ref_text"] = ref_text
+        else:
+            kwargs["x_vector_only_mode"] = True  # no transcript was supplied for the reference clip
+        with torch.inference_mode():
+            prompt = m.create_voice_clone_prompt(**kwargs)
+        shutil.copy2(tmp_path, os.path.join(PROFILES_DIR, f"{profile_id}.wav"))
+        with open(os.path.join(PROFILES_DIR, f"{profile_id}.pkl"), "wb") as f:
+            pickle.dump(prompt, f)
+        with open(os.path.join(PROFILES_DIR, f"{profile_id}.json"), "w") as f:
+            json.dump({"id": profile_id, "name": name, "ref_text": ref_text}, f, ensure_ascii=False)
+        prompt_cache[profile_id] = prompt  # make the new profile usable without a disk read
+        return {"id": profile_id, "name": name, "status": "created"}
+    finally:
+        if os.path.exists(tmp_path):
+            os.unlink(tmp_path)
+
+
+@app.delete("/api/tts/profiles/{profile_id}")
+def delete_profile(profile_id: str):
+    """Remove the profile's .pkl/.json/.wav files (those that exist) and its cached prompt; always answers "deleted"."""
+    candidates = [os.path.join(PROFILES_DIR, f"{profile_id}{suffix}") for suffix in (".pkl", ".json", ".wav")]
+    for path in filter(os.path.exists, candidates):
+        os.unlink(path)
+    prompt_cache.pop(profile_id, None)
+    return {"status": "deleted"}
+
+
+@app.post("/api/tts/speak")
+async def speak(
+    text: str = Form(...),
+    profile_id: str = Form(...),
+    language: str = Form("Korean"),
+):
+    """Synthesize `text` (one sentence per call) in a stored profile's voice; responds with audio/wav.
+
+    The cached voice clone prompt is used when available, otherwise the profile's reference wav plus
+    the ref_text from its metadata. Unknown or malformed profile ids get HTTP 404 {"error": ...}.
+    """
+    # profile_id is client input that ends up in file paths; anything but a bare name is "not found".
+    if not profile_id or os.path.basename(profile_id) != profile_id:
+        return JSONResponse(status_code=404, content={"error": "Profile not found"})
+    m = get_model()
+    kwargs = {"text": text, "language": language}
+    prompt = get_prompt(profile_id)
+    if prompt is not None:
+        kwargs["voice_clone_prompt"] = prompt
+    else:
+        # No pickled prompt: clone straight from the stored reference audio.
+        meta_path = os.path.join(PROFILES_DIR, f"{profile_id}.json")
+        ref_audio_path = os.path.join(PROFILES_DIR, f"{profile_id}.wav")
+        if not (os.path.exists(ref_audio_path) and os.path.exists(meta_path)):
+            # Returning a (dict, 404) tuple would be sent as a 200 JSON array, so build the response.
+            return JSONResponse(status_code=404, content={"error": "Profile not found"})
+        with open(meta_path) as f:
+            meta = json.load(f)
+        kwargs["ref_audio"] = ref_audio_path
+        if meta.get("ref_text"):
+            kwargs["ref_text"] = meta["ref_text"]
+        else:
+            kwargs["x_vector_only_mode"] = True
+
+    start = time.perf_counter()
+    with torch.inference_mode():
+        wavs, sr = m.generate_voice_clone(**kwargs)
+    elapsed = time.perf_counter() - start
+
+    audio_data = np.array(wavs[0], dtype=np.float32)
+    print(f"speak: {len(text)} chars → {len(audio_data)/sr:.1f}s audio in {elapsed:.1f}s")
+    buf = io.BytesIO()
+    sf.write(buf, audio_data, sr, format="WAV")
+    buf.seek(0)
+    return StreamingResponse(buf, media_type="audio/wav")
+
+
+from fastapi.responses import JSONResponse
+
+@app.exception_handler(Exception)
+async def global_exception_handler(request, exc):  # Catch-all handler: print the traceback, answer 500 with the message.
+    import traceback
+    traceback.print_exc()
+    return JSONResponse(status_code=500, content={"error": str(exc)})  # NOTE(review): str(exc) is sent to the client as-is
+
+
+if __name__ == "__main__":
+    import uvicorn
+    get_model()  # load the model before the server starts accepting requests
+    uvicorn.run(app, host="0.0.0.0", port=8090)  # listens on all interfaces, port 8090