refactor: 精简架构，去掉书籍管理，核心 TTS 代理

- 去掉 books/chapters CRUD、SQLAlchemy、SQLite 依赖 - 核心只剩 /api/tts + 智能分段 + 自动重试 - 新增 API_TOKEN 环境变量，管理接口 Bearer Token 鉴权 - 管理接口精简为 preview + config - 前端重写：TTS 试听 + 配置查看 + 接口文档 - Dockerfile/docker-compose 清理，去掉数据库卷
2026-03-27 15:10:58 +08:00
parent 30544f7f42
commit 2a87020b48
11 changed files with 381 additions and 1503 deletions
--- a/app/main.py
+++ b/app/main.py
@@ -1,6 +1,6 @@
 """
-TTS Book Service - 小米 MiMo TTS 转换服务
-为听书 App 提供音频接入接口
+TTS Proxy Service - 小米 MiMo TTS 音频转换代理
+核心功能: /api/tts 实时 TTS + 智能分段 + 自动重试
 """

 import os
@@ -15,13 +15,9 @@ from contextlib import asynccontextmanager
 from pathlib import Path

 import httpx
-from fastapi import FastAPI, HTTPException, Query, Request
-from fastapi.responses import FileResponse, HTMLResponse, JSONResponse, Response
+from fastapi import FastAPI, HTTPException, Request, Depends
+from fastapi.responses import FileResponse, HTMLResponse, Response
 from fastapi.staticfiles import StaticFiles
-from sqlalchemy import Column, Integer, String, Text, DateTime, func, select, delete
-from sqlalchemy.ext.asyncio import create_async_engine, AsyncSession, async_sessionmaker
-from sqlalchemy.orm import DeclarativeBase
-from urllib.parse import parse_qs, unquote

 import config

@@ -32,29 +28,24 @@ logging.basicConfig(
    format="%(asctime)s [%(levelname)s] %(message)s",
    datefmt="%Y-%m-%d %H:%M:%S",
 )
-logger = logging.getLogger("tts-service")
+logger = logging.getLogger("tts-proxy")

 # ── Text Segmentation ─────────────────────────────────────────────────────

-# MiMo TTS 单次请求文本上限（保守值，实际约 5000）
 MAX_CHUNK_CHARS = 2000

-# 分割优先级: 段落 > 句子 > 逗号/分号 > 按长度硬切
 _SEGMENT_PATTERNS = [
    "\n\n",      # 段落
    "\n",        # 换行
-    "。", "！", "？", "…",   # 中文句末
-    ".", "!", "?",          # 英文句末
-    "；", ";",              # 分号
-    "，", ",",              # 逗号
+    "。", "！", "？", "…",
+    ".", "!", "?",
+    "；", ";",
+    "，", ",",
 ]


 def split_text(text: str, max_chars: int = MAX_CHUNK_CHARS) -> list[str]:
-    """
-    智能分段：尽量在自然边界（段落/句子/标点）处切分，
-    保证每段不超过 max_chars 字符。
-    """
+    """智能分段：在自然边界切分，每段不超过 max_chars"""
    text = text.strip()
    if len(text) <= max_chars:
        return [text]
@@ -67,7 +58,6 @@ def split_text(text: str, max_chars: int = MAX_CHUNK_CHARS) -> list[str]:
            chunks.append(remaining)
            break

-        # 在 max_chars 范围内找最佳切割点
        window = remaining[:max_chars]
        cut_pos = -1

@@ -78,7 +68,6 @@ def split_text(text: str, max_chars: int = MAX_CHUNK_CHARS) -> list[str]:
                break

        if cut_pos <= 0:
-            # 没找到任何分隔符，硬切
            cut_pos = max_chars

        chunk = remaining[:cut_pos].strip()
@@ -89,16 +78,35 @@ def split_text(text: str, max_chars: int = MAX_CHUNK_CHARS) -> list[str]:
    return chunks


-# ── Audio Concatenation ───────────────────────────────────────────────────
+# ── Auth ──────────────────────────────────────────────────────────────────
+
+async def verify_token(request: Request):
+    """Bearer Token 验证（API_TOKEN 未配置时跳过）"""
+    if not config.API_TOKEN:
+        return
+    auth = request.headers.get("Authorization", "")
+    if not auth.startswith("Bearer "):
+        raise HTTPException(401, "缺少 Authorization: Bearer <token>")
+    if auth[7:] != config.API_TOKEN:
+        raise HTTPException(403, "Token 无效")
+
+
+# ── Audio Utils ───────────────────────────────────────────────────────────
+
+def wav_to_mp3(wav_path: str, mp3_path: str):
+    result = subprocess.run(
+        ["ffmpeg", "-y", "-i", wav_path, "-codec:a", "libmp3lame", "-qscale:a", "2", mp3_path],
+        capture_output=True, text=True,
+    )
+    if result.returncode != 0:
+        raise RuntimeError(f"ffmpeg 转换失败: {result.stderr[:300]}")
+

 def concat_mp3_files(mp3_paths: list[str], output_path: str):
-    """用 ffmpeg 将多个 MP3 文件拼接为一个"""
-    # 创建 ffmpeg concat 文件列表
    list_path = output_path + ".concat_list.txt"
    with open(list_path, "w") as f:
        for p in mp3_paths:
            f.write(f"file '{p}'\n")
-
    try:
        result = subprocess.run(
            ["ffmpeg", "-y", "-f", "concat", "-safe", "0", "-i", list_path,
@@ -111,46 +119,15 @@ def concat_mp3_files(mp3_paths: list[str], output_path: str):
        os.remove(list_path)


-# ── Database ──────────────────────────────────────────────────────────────
-
-engine = create_async_engine(config.DATABASE_URL, echo=False)
-async_session = async_sessionmaker(engine, class_=AsyncSession, expire_on_commit=False)
-
-
-class Base(DeclarativeBase):
-    pass
-
-
-class Book(Base):
-    __tablename__ = "books"
-    id = Column(Integer, primary_key=True, autoincrement=True)
-    book_id = Column(String(100), unique=True, nullable=False, index=True)
-    title = Column(String(500), nullable=False)
-    author = Column(String(200), default="")
-    created_at = Column(DateTime, server_default=func.now())
-
-
-class Chapter(Base):
-    __tablename__ = "chapters"
-    id = Column(Integer, primary_key=True, autoincrement=True)
-    book_id = Column(String(100), nullable=False, index=True)
-    chapter_id = Column(String(100), nullable=False, index=True)
-    app_chapter_id = Column(String(100), default="")
-    title = Column(String(500), default="")
-    text_content = Column(Text, default="")
-    audio_file = Column(String(500), default="")
-    status = Column(String(20), default="pending")
-    error_msg = Column(Text, default="")
-    created_at = Column(DateTime, server_default=func.now())
-    updated_at = Column(DateTime, server_default=func.now(), onupdate=func.now())
-
-
 # ── TTS Service ───────────────────────────────────────────────────────────

+MAX_TTS_RETRIES = 3
+
+
 async def call_mimo_tts(text: str, style: str = "", voice: str = "") -> bytes:
-    """调用小米 MiMo TTS API，返回 WAV 音频字节"""
+    """调用 MiMo TTS API，返回 WAV 字节。5xx 自动重试最多 3 次"""
    if not config.MIMO_API_KEY:
-        raise HTTPException(500, "MIMO_API_KEY 未配置，请设置环境变量")
+        raise HTTPException(500, "MIMO_API_KEY 未配置")

    content = f"<style>{style}</style>{text}" if style else text
    use_voice = voice or config.MIMO_VOICE
@@ -160,539 +137,216 @@ async def call_mimo_tts(text: str, style: str = "", voice: str = "") -> bytes:
        "audio": {"format": "wav", "voice": use_voice},
        "messages": [{"role": "assistant", "content": content}],
    }
-
    headers = {
        "Content-Type": "application/json",
        "api-key": config.MIMO_API_KEY,
    }

-    t0 = time.time()
-    logger.info(f"MiMo TTS 请求: text_len={len(text)}, style={style or '(默认)'}")
-
-    async with httpx.AsyncClient(timeout=120) as client:
-        resp = await client.post(config.MIMO_API_ENDPOINT, json=payload, headers=headers)
-
-    elapsed = round(time.time() - t0, 2)
-
-    if resp.status_code != 200:
-        logger.error(f"MiMo TTS 错误: HTTP {resp.status_code}, 耗时 {elapsed}s, 响应: {resp.text[:200]}")
-        raise HTTPException(502, f"MiMo TTS API 错误: HTTP {resp.status_code} - {resp.text[:300]}")
-
-    data = resp.json()
-    if data.get("error"):
-        logger.error(f"MiMo TTS 业务错误: {data['error']}, 耗时 {elapsed}s")
-        raise HTTPException(502, f"MiMo TTS 错误: {data['error']}")
-
-    try:
-        audio_b64 = data["choices"][0]["message"]["audio"]["data"]
-        wav_bytes = base64.b64decode(audio_b64)
-        logger.info(f"MiMo TTS 成功: wav_size={len(wav_bytes)} bytes, 耗时 {elapsed}s")
-        return wav_bytes
-    except (KeyError, IndexError, TypeError) as e:
-        logger.error(f"MiMo TTS 响应解析失败: {e}, 耗时 {elapsed}s")
-        raise HTTPException(502, f"MiMo TTS 响应解析失败: {e}")
-
-
-def wav_to_mp3(wav_path: str, mp3_path: str):
-    """用 ffmpeg 将 WAV 转为 MP3"""
-    result = subprocess.run(
-        ["ffmpeg", "-y", "-i", wav_path, "-codec:a", "libmp3lame", "-qscale:a", "2", mp3_path],
-        capture_output=True, text=True,
-    )
-    if result.returncode != 0:
-        raise RuntimeError(f"ffmpeg 转换失败: {result.stderr[:300]}")
-
-
-async def generate_chapter_audio(chapter_id_str: str):
-    """为指定章节生成音频（支持长文本自动分段拼接）"""
-    async with async_session() as db:
-        result = await db.execute(select(Chapter).where(Chapter.chapter_id == chapter_id_str))
-        chapter = result.scalar_one_or_none()
-        if not chapter:
-            return
-
-        if not chapter.text_content.strip():
-            chapter.status = "error"
-            chapter.error_msg = "文本内容为空"
-            await db.commit()
-            return
-
-        chapter.status = "generating"
-        await db.commit()
-
+    last_exc = None
+    for attempt in range(1, MAX_TTS_RETRIES + 1):
+        t0 = time.time()
        try:
-            audio_dir = Path(config.AUDIO_DIR) / chapter.book_id
-            audio_dir.mkdir(parents=True, exist_ok=True)
+            async with httpx.AsyncClient(timeout=120) as client:
+                resp = await client.post(config.MIMO_API_ENDPOINT, json=payload, headers=headers)

-            mp3_path = str(audio_dir / f"{chapter.chapter_id}.mp3")
-            chunks = split_text(chapter.text_content)
+            elapsed = round(time.time() - t0, 2)

-            if len(chunks) == 1:
-                # 单段：直接生成
-                wav_bytes = await call_mimo_tts(chapter.text_content)
-                wav_path = str(audio_dir / f"{chapter.chapter_id}.wav")
-                with open(wav_path, "wb") as f:
-                    f.write(wav_bytes)
-                loop = asyncio.get_event_loop()
-                await loop.run_in_executor(None, wav_to_mp3, wav_path, mp3_path)
-                os.remove(wav_path)
-            else:
-                # 多段：逐段生成 → 拼接
-                logger.info(f"章节 {chapter_id_str}: 文本 {len(chapter.text_content)} 字, 分 {len(chunks)} 段生成")
-                tmp_mp3_paths = []
-                for i, chunk in enumerate(chunks):
-                    wav_bytes = await call_mimo_tts(chunk)
-                    tmp_id = f"{chapter.chapter_id}_part{i}"
-                    wav_path = str(audio_dir / f"{tmp_id}.wav")
-                    tmp_mp3 = str(audio_dir / f"{tmp_id}.mp3")
+            if resp.status_code != 200:
+                logger.error(f"MiMo TTS HTTP {resp.status_code}, {elapsed}s, {resp.text[:200]}")
+                err = HTTPException(502, f"MiMo TTS API 错误: HTTP {resp.status_code}")
+                if resp.status_code >= 500 and attempt < MAX_TTS_RETRIES:
+                    last_exc = err
+                    await asyncio.sleep(1.5 * attempt)
+                    continue
+                raise err

-                    with open(wav_path, "wb") as f:
-                        f.write(wav_bytes)
+            data = resp.json()
+            if data.get("error"):
+                raise HTTPException(502, f"MiMo TTS 错误: {data['error']}")

-                    loop = asyncio.get_event_loop()
-                    await loop.run_in_executor(None, wav_to_mp3, wav_path, tmp_mp3)
-                    os.remove(wav_path)
-                    tmp_mp3_paths.append(tmp_mp3)
+            audio_b64 = data["choices"][0]["message"]["audio"]["data"]
+            wav_bytes = base64.b64decode(audio_b64)
+            logger.info(f"MiMo TTS OK: {len(wav_bytes)} bytes, {elapsed}s (attempt {attempt})")
+            return wav_bytes

-                # 拼接
-                await loop.run_in_executor(None, concat_mp3_files, tmp_mp3_paths, mp3_path)
-                for p in tmp_mp3_paths:
-                    os.remove(p)
-                logger.info(f"章节 {chapter_id_str}: {len(chunks)} 段拼接完成")
-
-            chapter.audio_file = mp3_path
-            chapter.status = "ready"
-            chapter.error_msg = ""
+        except HTTPException:
+            raise
        except Exception as e:
-            chapter.status = "error"
-            chapter.error_msg = str(e)[:500]
-            logger.error(f"章节 {chapter_id_str} 生成失败: {e}")
+            elapsed = round(time.time() - t0, 2)
+            logger.error(f"MiMo TTS 异常: {e}, {elapsed}s, attempt {attempt}")
+            last_exc = HTTPException(502, f"MiMo TTS 异常: {e}")
+            if attempt < MAX_TTS_RETRIES:
+                await asyncio.sleep(1.5 * attempt)

-        await db.commit()
+    raise last_exc


-# ── App Lifecycle ──────────────────────────────────────────────────────────
+# ── Core: generate MP3 from text ──────────────────────────────────────────
+
+async def generate_mp3(text: str, style: str = "", voice: str = "") -> bytes:
+    """文本 → MP3 字节。长文本自动分段拼接"""
+    chunks = split_text(text)
+    tmp_dir = Path(config.AUDIO_DIR) / "_tmp"
+    tmp_dir.mkdir(parents=True, exist_ok=True)
+
+    if len(chunks) == 1:
+        wav_bytes = await call_mimo_tts(text, style, voice)
+        uid = uuid.uuid4().hex
+        wav_path = str(tmp_dir / f"{uid}.wav")
+        mp3_path = str(tmp_dir / f"{uid}.mp3")
+        with open(wav_path, "wb") as f:
+            f.write(wav_bytes)
+        loop = asyncio.get_event_loop()
+        await loop.run_in_executor(None, wav_to_mp3, wav_path, mp3_path)
+        with open(mp3_path, "rb") as f:
+            mp3_bytes = f.read()
+        os.remove(wav_path)
+        os.remove(mp3_path)
+        return mp3_bytes
+
+    # 多段
+    logger.info(f"文本 {len(text)} 字, 分 {len(chunks)} 段生成")
+    mp3_paths = []
+    for chunk in chunks:
+        wav_bytes = await call_mimo_tts(chunk, style, voice)
+        uid = uuid.uuid4().hex
+        wav_path = str(tmp_dir / f"{uid}.wav")
+        mp3_path = str(tmp_dir / f"{uid}.mp3")
+        with open(wav_path, "wb") as f:
+            f.write(wav_bytes)
+        loop = asyncio.get_event_loop()
+        await loop.run_in_executor(None, wav_to_mp3, wav_path, mp3_path)
+        os.remove(wav_path)
+        mp3_paths.append(mp3_path)
+
+    merged_id = uuid.uuid4().hex
+    merged_path = str(tmp_dir / f"{merged_id}.mp3")
+    await loop.run_in_executor(None, concat_mp3_files, mp3_paths, merged_path)
+    with open(merged_path, "rb") as f:
+        mp3_bytes = f.read()
+    for p in mp3_paths:
+        os.remove(p)
+    os.remove(merged_path)
+    return mp3_bytes
+
+
+# ── App ───────────────────────────────────────────────────────────────────

@asynccontextmanager
 async def lifespan(app: FastAPI):
    os.makedirs(config.AUDIO_DIR, exist_ok=True)
-    os.makedirs(os.path.join(config.BASE_DIR, "data"), exist_ok=True)
-    async with engine.begin() as conn:
-        await conn.run_sync(Base.metadata.create_all)
+    (Path(config.AUDIO_DIR) / "_tmp").mkdir(exist_ok=True)
+    (Path(config.AUDIO_DIR) / "_preview").mkdir(exist_ok=True)
    yield


-app = FastAPI(title="TTS Book Service", lifespan=lifespan)
+app = FastAPI(title="TTS Proxy Service", lifespan=lifespan)


+# ── 健康检查 ───────────────────────────────────────────────────────────────
+
@app.get("/health")
-async def health_check():
-    """健康检查"""
-    return {"status": "ok", "service": "TTS Book Service", "api_key_configured": bool(config.MIMO_API_KEY)}
+async def health():
+    return {
+        "status": "ok",
+        "api_key": bool(config.MIMO_API_KEY),
+        "token": bool(config.API_TOKEN),
+    }


-# ── 听书 App 音频接入接口 ─────────────────────────────────────────────────
-
-@app.get("/api/book/{book_id}")
-async def get_book_info(book_id: str):
-    """获取书籍信息及章节列表（听书 App 调用）"""
-    async with async_session() as db:
-        book_result = await db.execute(select(Book).where(Book.book_id == book_id))
-        book = book_result.scalar_one_or_none()
-        if not book:
-            raise HTTPException(404, f"书籍 {book_id} 不存在")
-
-        ch_result = await db.execute(
-            select(Chapter).where(Chapter.book_id == book_id).order_by(Chapter.id)
-        )
-        chapters = ch_result.scalars().all()
-
-        return {
-            "book_id": book.book_id,
-            "title": book.title,
-            "author": book.author,
-            "chapters": [
-                {
-                    "chapter_id": ch.chapter_id,
-                    "app_chapter_id": ch.app_chapter_id,
-                    "title": ch.title,
-                    "status": ch.status,
-                    "audio_url": f"/api/book/{book_id}/chapter/{ch.chapter_id}/audio"
-                    if ch.status == "ready" else None,
-                }
-                for ch in chapters
-            ],
-        }
-
-
-@app.get("/api/book/{book_id}/chapter/{chapter_id}/audio")
-async def get_chapter_audio(book_id: str, chapter_id: str):
-    """获取章节音频文件（听书 App 调用）"""
-    async with async_session() as db:
-        result = await db.execute(
-            select(Chapter).where(
-                Chapter.book_id == book_id, Chapter.chapter_id == chapter_id
-            )
-        )
-        chapter = result.scalar_one_or_none()
-
-    if not chapter:
-        raise HTTPException(404, "章节不存在")
-    if chapter.status != "ready" or not chapter.audio_file:
-        raise HTTPException(404, f"音频尚未生成，当前状态: {chapter.status}")
-
-    if not os.path.exists(chapter.audio_file):
-        raise HTTPException(404, "音频文件丢失")
-
-    return FileResponse(chapter.audio_file, media_type="audio/mpeg", filename=f"{chapter_id}.mp3")
-
-
-# ── 实时 TTS 接口（兼容听书 App 格式）─────────────────────────────────────
+# ── 核心接口: 实时 TTS ────────────────────────────────────────────────────

@app.post("/api/tts")
 async def realtime_tts(request: Request):
    """
-    实时 TTS 生成接口
-    兼容两种 App 发送格式:
-      1. JSON body:  {"text": "内容", "style": "开心"}
-      2. Form body:  tex=内容&spd=5 (百度风格)
-    返回: MP3 音频二进制流 (audio/mpeg)，失败返回 JSON
+    实时 TTS → 返回 MP3 音频流
+
+    JSON: {"text": "内容", "style": "开心", "voice": ""}
+    Form: tex=内容 (百度兼容)
    """
-    text = ""
-    style = ""
-    voice = ""
+    text = style = voice = ""
    content_type = request.headers.get("content-type", "")

    try:
        if "json" in content_type:
            data = await request.json()
-            text = data.get("text", "").strip()
-            style = data.get("style", "").strip()
-            voice = data.get("voice", "").strip()
+            text = (data.get("text") or "").strip()
+            style = (data.get("style") or "").strip()
+            voice = (data.get("voice") or "").strip()
        else:
-            # form-urlencoded (百度风格)
-            body_bytes = await request.body()
-            params = parse_qs(body_bytes.decode("utf-8"))
-            text = (params.get("tex", [""])[0]).strip()
-            # URL 解码（百度会 double-encode）
-            text = unquote(unquote(text))
+            from urllib.parse import parse_qs, unquote
+            body = await request.body()
+            params = parse_qs(body.decode("utf-8"))
+            text = unquote(unquote((params.get("tex", [""])[0]).strip()))
    except Exception:
        pass

    if not text:
        return Response(
-            content=json.dumps({"status": 40000001, "message": "text/tex 不能为空"}, ensure_ascii=False),
-            media_type="application/json",
-            status_code=400,
+            content=json.dumps({"status": 40000001, "message": "text 不能为空"}, ensure_ascii=False),
+            media_type="application/json", status_code=400,
        )

    try:
-        # 文本分段
-        chunks = split_text(text)
-        logger.info(f"实时 TTS: text_len={len(text)}, chunks={len(chunks)}, style={style or '(默认)'}, voice={voice or '(默认)'}")
-
-        tmp_dir = Path(config.AUDIO_DIR) / "_tmp"
-        tmp_dir.mkdir(parents=True, exist_ok=True)
-
-        if len(chunks) == 1:
-            # 单段：直接生成
-            wav_bytes = await call_mimo_tts(text, style, voice)
-            tmp_id = uuid.uuid4().hex
-            wav_path = str(tmp_dir / f"{tmp_id}.wav")
-            mp3_path = str(tmp_dir / f"{tmp_id}.mp3")
-
-            with open(wav_path, "wb") as f:
-                f.write(wav_bytes)
-
-            loop = asyncio.get_event_loop()
-            await loop.run_in_executor(None, wav_to_mp3, wav_path, mp3_path)
-
-            with open(mp3_path, "rb") as f:
-                mp3_bytes = f.read()
-
-            os.remove(wav_path)
-            os.remove(mp3_path)
-        else:
-            # 多段：逐段生成 → 拼接
-            mp3_paths = []
-            for i, chunk in enumerate(chunks):
-                wav_bytes = await call_mimo_tts(chunk, style, voice)
-                chunk_id = uuid.uuid4().hex
-                wav_path = str(tmp_dir / f"{chunk_id}.wav")
-                mp3_path = str(tmp_dir / f"{chunk_id}.mp3")
-
-                with open(wav_path, "wb") as f:
-                    f.write(wav_bytes)
-
-                loop = asyncio.get_event_loop()
-                await loop.run_in_executor(None, wav_to_mp3, wav_path, mp3_path)
-                os.remove(wav_path)
-                mp3_paths.append(mp3_path)
-
-            # 拼接所有 MP3
-            merged_id = uuid.uuid4().hex
-            merged_path = str(tmp_dir / f"{merged_id}.mp3")
-            await loop.run_in_executor(None, concat_mp3_files, mp3_paths, merged_path)
-
-            with open(merged_path, "rb") as f:
-                mp3_bytes = f.read()
-
-            # 清理
-            for p in mp3_paths:
-                os.remove(p)
-            os.remove(merged_path)
-
+        mp3_bytes = await generate_mp3(text, style, voice)
        return Response(content=mp3_bytes, media_type="audio/mpeg")
-
    except Exception as e:
        return Response(
-            content=json.dumps({"status": 50000002, "message": str(e)[:300]}, ensure_ascii=False),
-            media_type="application/json",
-            status_code=500,
+            content=json.dumps({"status": 500, "message": str(e)[:300]}, ensure_ascii=False),
+            media_type="application/json", status_code=500,
        )


-# ── 管理 API ──────────────────────────────────────────────────────────────
+# ── 管理接口 ───────────────────────────────────────────────────────────────

-# --- Books ---
-
-@app.get("/admin/api/books")
-async def list_books():
-    async with async_session() as db:
-        result = await db.execute(select(Book).order_by(Book.id.desc()))
-        books = result.scalars().all()
-        return [{"book_id": b.book_id, "title": b.title, "author": b.author} for b in books]
-
-
-@app.post("/admin/api/books")
-async def create_book(request: Request):
+@app.post("/admin/api/preview")
+async def preview(request: Request, _auth=Depends(verify_token)):
+    """TTS 试听，返回音频 URL"""
    data = await request.json()
-    book_id = data.get("book_id", "").strip()
-    title = data.get("title", "").strip()
-    author = data.get("author", "").strip()
-
-    if not book_id or not title:
-        raise HTTPException(400, "book_id 和 title 不能为空")
-
-    async with async_session() as db:
-        existing = await db.execute(select(Book).where(Book.book_id == book_id))
-        if existing.scalar_one_or_none():
-            raise HTTPException(409, f"书籍 {book_id} 已存在")
-
-        book = Book(book_id=book_id, title=title, author=author)
-        db.add(book)
-        await db.commit()
-        return {"ok": True, "book_id": book_id}
-
-
-@app.delete("/admin/api/books/{book_id}")
-async def delete_book(book_id: str):
-    async with async_session() as db:
-        await db.execute(delete(Chapter).where(Chapter.book_id == book_id))
-        await db.execute(delete(Book).where(Book.book_id == book_id))
-        await db.commit()
-        return {"ok": True}
-
-
-# --- Chapters ---
-
-@app.get("/admin/api/books/{book_id}/chapters")
-async def list_chapters(book_id: str):
-    async with async_session() as db:
-        result = await db.execute(
-            select(Chapter).where(Chapter.book_id == book_id).order_by(Chapter.id)
-        )
-        chapters = result.scalars().all()
-        return [
-            {
-                "chapter_id": ch.chapter_id,
-                "app_chapter_id": ch.app_chapter_id,
-                "title": ch.title,
-                "text_content": ch.text_content[:200] + "..." if len(ch.text_content) > 200 else ch.text_content,
-                "text_length": len(ch.text_content),
-                "status": ch.status,
-                "error_msg": ch.error_msg,
-                "has_audio": ch.status == "ready",
-            }
-            for ch in chapters
-        ]
-
-
-@app.post("/admin/api/books/{book_id}/chapters")
-async def create_chapter(book_id: str, request: Request):
-    data = await request.json()
-    chapter_id = data.get("chapter_id", "").strip()
-    title = data.get("title", "").strip()
-    app_chapter_id = data.get("app_chapter_id", "").strip()
-    text_content = data.get("text_content", "").strip()
-
-    if not chapter_id:
-        raise HTTPException(400, "chapter_id 不能为空")
-
-    async with async_session() as db:
-        existing = await db.execute(
-            select(Chapter).where(Chapter.book_id == book_id, Chapter.chapter_id == chapter_id)
-        )
-        if existing.scalar_one_or_none():
-            raise HTTPException(409, f"章节 {chapter_id} 已存在")
-
-        chapter = Chapter(
-            book_id=book_id,
-            chapter_id=chapter_id,
-            app_chapter_id=app_chapter_id or chapter_id,
-            title=title,
-            text_content=text_content,
-        )
-        db.add(chapter)
-        await db.commit()
-        return {"ok": True, "chapter_id": chapter_id}
-
-
-@app.put("/admin/api/books/{book_id}/chapters/{chapter_id}")
-async def update_chapter(book_id: str, chapter_id: str, request: Request):
-    data = await request.json()
-    async with async_session() as db:
-        result = await db.execute(
-            select(Chapter).where(Chapter.book_id == book_id, Chapter.chapter_id == chapter_id)
-        )
-        chapter = result.scalar_one_or_none()
-        if not chapter:
-            raise HTTPException(404, "章节不存在")
-
-        if "text_content" in data:
-            chapter.text_content = data["text_content"]
-        if "title" in data:
-            chapter.title = data["title"]
-        if "app_chapter_id" in data:
-            chapter.app_chapter_id = data["app_chapter_id"]
-
-        await db.commit()
-        return {"ok": True}
-
-
-@app.delete("/admin/api/books/{book_id}/chapters/{chapter_id}")
-async def delete_chapter(book_id: str, chapter_id: str):
-    async with async_session() as db:
-        await db.execute(
-            delete(Chapter).where(Chapter.book_id == book_id, Chapter.chapter_id == chapter_id)
-        )
-        await db.commit()
-        return {"ok": True}
-
-
-# --- TTS ---
-
-@app.post("/admin/api/books/{book_id}/chapters/{chapter_id}/generate")
-async def generate_audio(book_id: str, chapter_id: str):
-    """手动生成单章音频"""
-    await generate_chapter_audio(chapter_id)
-    async with async_session() as db:
-        result = await db.execute(
-            select(Chapter).where(Chapter.book_id == book_id, Chapter.chapter_id == chapter_id)
-        )
-        ch = result.scalar_one_or_none()
-    return {"ok": True, "status": ch.status, "error_msg": ch.error_msg}
-
-
-@app.post("/admin/api/books/{book_id}/generate-all")
-async def generate_all_chapters(book_id: str):
-    """批量生成书籍所有章节音频（并发，限制 3 路）"""
-    async with async_session() as db:
-        result = await db.execute(
-            select(Chapter).where(Chapter.book_id == book_id, Chapter.status != "ready")
-        )
-        chapters = result.scalars().all()
-
-    chapter_ids = [ch.chapter_id for ch in chapters]
-    if not chapter_ids:
-        return {"ok": True, "total": 0, "chapter_ids": [], "message": "没有需要生成的章节"}
-
-    # 并发生成，限制同时 3 个请求避免过载
-    sem = asyncio.Semaphore(3)
-
-    async def _gen(cid: str):
-        async with sem:
-            await generate_chapter_audio(cid)
-
-    tasks = [_gen(cid) for cid in chapter_ids]
-    results = await asyncio.gather(*tasks, return_exceptions=True)
-
-    # 统计结果
-    errors = [str(r) for r in results if isinstance(r, Exception)]
-    success_count = len(chapter_ids) - len(errors)
-
-    return {
-        "ok": True,
-        "total": len(chapter_ids),
-        "success": success_count,
-        "failed": len(errors),
-        "errors": errors[:10] if errors else [],
-        "chapter_ids": chapter_ids,
-    }
-
-
-# --- TTS 试听 ---
-
-@app.post("/admin/api/tts/preview")
-async def tts_preview(request: Request):
-    """试听 TTS 效果"""
-    data = await request.json()
-    text = data.get("text", "").strip()
-    style = data.get("style", "").strip()
-    voice = data.get("voice", "").strip()
-
+    text = (data.get("text") or "").strip()
+    style = (data.get("style") or "").strip()
+    voice = (data.get("voice") or "").strip()
    if not text:
        raise HTTPException(400, "文本不能为空")

-    wav_bytes = await call_mimo_tts(text, style, voice)
-    audio_dir = Path(config.AUDIO_DIR) / "_preview"
-    audio_dir.mkdir(parents=True, exist_ok=True)
-
+    mp3_bytes = await generate_mp3(text, style, voice)
+    preview_dir = Path(config.AUDIO_DIR) / "_preview"
    filename = f"{uuid.uuid4().hex}.mp3"
-    wav_path = str(audio_dir / f"{uuid.uuid4().hex}.wav")
-    mp3_path = str(audio_dir / filename)
-
-    with open(wav_path, "wb") as f:
-        f.write(wav_bytes)
-
-    loop = asyncio.get_event_loop()
-    await loop.run_in_executor(None, wav_to_mp3, wav_path, mp3_path)
-    os.remove(wav_path)
-
+    with open(preview_dir / filename, "wb") as f:
+        f.write(mp3_bytes)
    return {"ok": True, "url": f"/audio/_preview/{filename}"}


@app.get("/admin/api/config")
-async def get_config():
+async def config_info(_auth=Depends(verify_token)):
    return {
        "endpoint": config.MIMO_API_ENDPOINT,
        "model": config.MIMO_TTS_MODEL,
        "voice": config.MIMO_VOICE,
-        "api_key_masked": config.MIMO_API_KEY[:6] + "****" if config.MIMO_API_KEY else "未配置",
-        "max_chunk_chars": MAX_CHUNK_CHARS,
+        "api_key": config.MIMO_API_KEY[:6] + "****" if config.MIMO_API_KEY else "未配置",
+        "max_chunk": MAX_CHUNK_CHARS,
+        "token_set": bool(config.API_TOKEN),
    }


 # ── 配置文件下载 ───────────────────────────────────────────────────────────

@app.get("/httpTts.json")
-async def serve_http_tts_config():
-    """提供 App 导入用的音频源配置文件"""
-    config_path = os.path.join(config.BASE_DIR, "httpTts-mimo.json")
-    if os.path.exists(config_path):
-        return FileResponse(config_path, media_type="application/json")
-    raise HTTPException(404, "配置文件不存在")
+async def serve_config():
+    path = os.path.join(config.BASE_DIR, "httpTts-mimo.json")
+    if os.path.exists(path):
+        return FileResponse(path, media_type="application/json")
+    raise HTTPException(404)


-# ── 静态文件 & 前端 ──────────────────────────────────────────────────────
+# ── 静态 & 前端 ───────────────────────────────────────────────────────────

 app.mount("/audio", StaticFiles(directory=config.AUDIO_DIR), name="audio")


@app.get("/", response_class=HTMLResponse)
 async def frontend():
-    html_path = os.path.join(config.BASE_DIR, "static", "index.html")
-    with open(html_path, "r", encoding="utf-8") as f:
+    with open(os.path.join(config.BASE_DIR, "static", "index.html"), "r", encoding="utf-8") as f:
        return HTMLResponse(f.read())