feat: add provider analytics summary

2026-04-18 22:01:34 +08:00
parent e99a7fbe14
commit 4d54c144a8
15 changed files with 437 additions and 36 deletions
--- a/README.md
+++ b/README.md
@@ -134,6 +134,7 @@ npm run build
 | GET | `/api/generations/jobs/{job_id}` | 查询生成任务事件流 |
 | GET | `/api/generations/{story_id}/jobs` | 查询故事生成与重试历史 |
 | GET | `/api/generations/{story_id}/provider-stats` | 查询 Provider 调用聚合指标 |
 | GET | `/api/generations/provider-analytics` | 查询当前用户跨故事 Provider 运营摘要 |
 | GET | `/api/stories` | 故事列表 |
 | GET | `/api/stories/{story_id}` | 故事详情 |
 | DELETE | `/api/stories/{story_id}` | 删除故事 |
--- a/admin-frontend/src/components/GenerationTrace.vue
+++ b/admin-frontend/src/components/GenerationTrace.vue
@@ -1,5 +1,5 @@
 <script setup lang="ts">
-import { computed, ref, watch } from 'vue'
+import { computed, onBeforeUnmount, ref, watch } from 'vue'
 import { BoltIcon, ClockIcon } from '@heroicons/vue/24/outline'
 import { api } from '../api/client'
 import LoadingSpinner from './ui/LoadingSpinner.vue'
@@ -64,12 +64,18 @@ const activeJob = ref<GenerationJobDetail | null>(null)
 const providerStats = ref<GenerationProviderStats | null>(null)
 const loading = ref(false)
 const error = ref('')
 let refreshTimer: ReturnType<typeof setInterval> | null = null
 const isDark = computed(() => props.tone === 'dark')
 const latestJob = computed(() => jobs.value[0] ?? null)
 const activeEvents = computed(() => activeJob.value?.events.slice(-10) ?? [])
 const activeProgress = computed(() => activeJob.value?.progress_percent ?? latestJob.value?.progress_percent ?? 0)
 const activeProgressLabel = computed(() => activeJob.value?.progress_label ?? latestJob.value?.progress_label ?? '暂无进度')
 // Polling is wanted only while the job on display (the selected job, otherwise the
 // newest one in the list) has not reached a terminal state.
 const shouldAutoRefresh = computed(() => {
  const trackedJob = activeJob.value || latestJob.value
  return trackedJob ? !trackedJob.is_terminal : false
 })
 const providerSuccessRate = computed(() => {
  if (!providerStats.value?.total_calls) return null
  return Math.round((providerStats.value.successful_calls / providerStats.value.total_calls) * 100)
@@ -206,6 +212,13 @@ async function refresh() {
  }
 }
 /** Cancel the polling interval, if one is running, and drop its handle. */
 function stopAutoRefresh() {
  if (!refreshTimer) return
  clearInterval(refreshTimer)
  refreshTimer = null
 }
 watch(
  () => props.storyId,
  () => {
@@ -214,6 +227,19 @@ watch(
  { immediate: true },
 )
 // Re-arm polling whenever the auto-refresh condition changes. Any existing timer is
 // cleared first, so at most one interval is active at a time.
 watch(shouldAutoRefresh, (enabled) => {
  stopAutoRefresh()
  if (!enabled) return
  const pollOnce = () => {
    // Skip this tick while the `loading` flag is set.
    if (loading.value) return
    void refresh()
  }
  refreshTimer = setInterval(pollOnce, 2500)
 })
 onBeforeUnmount(stopAutoRefresh)
 defineExpose({ refresh })
 </script>
--- a/admin-frontend/src/views/MyStories.vue
+++ b/admin-frontend/src/views/MyStories.vue
@@ -34,8 +34,30 @@ interface StoryItem {
  last_error: string | null
 }
 /** One row of a `by_provider` breakdown: call statistics for a single capability/adapter pair. */
 interface GenerationProviderStat {
  /** Capability label reported by the API (the backend tests use values such as `image` and `tts`). */
  capability: string
  /** Adapter label reported by the API for that capability. */
  adapter: string
  /** Number of calls counted for this pair. */
  call_count: number
  /** Calls counted as successful. */
  success_count: number
  /** Calls counted as failed. */
  failure_count: number
  /** Average latency in milliseconds; null is presumably "no latency samples" — confirm with the backend. */
  avg_latency_ms: number | null
  /** Estimated cost in US dollars for this pair. */
  estimated_cost_usd: number
 }
 /** Response shape of `GET /api/generations/provider-analytics` (per-user, cross-story summary). */
 interface GenerationProviderAnalytics {
  /** Total provider calls included in the summary. */
  total_calls: number
  /** Calls counted as successful. */
  successful_calls: number
  /** Calls counted as failed. */
  failed_calls: number
  /** Average latency in milliseconds; null is presumably "no latency samples" — confirm with the backend. */
  avg_latency_ms: number | null
  /** Estimated total cost in US dollars. */
  estimated_cost_usd: number
  /** Number of generation jobs counted for the user. */
  job_count: number
  /** Number of distinct stories counted for the user. */
  story_count: number
  /** Per capability/adapter rows, in the order returned by the API. */
  by_provider: GenerationProviderStat[]
 }
 const router = useRouter()
 const stories = ref<StoryItem[]>([])
 const providerAnalytics = ref<GenerationProviderAnalytics | null>(null)
 const loading = ref(true)
 const error = ref('')
 const showCreateModal = ref(false)
@@ -45,10 +67,22 @@ const readableCount = computed(() =>
 const attentionCount = computed(() =>
  stories.value.filter((story) => needsGenerationAttention(story.generation_status)).length,
 )
 // Whole-number success percentage, or null when there is no analytics payload or no calls.
 const providerSuccessRate = computed(() => {
  const summary = providerAnalytics.value
  if (!summary || !summary.total_calls) return null
  const ratio = summary.successful_calls / summary.total_calls
  return Math.round(ratio * 100)
 })
 // First row of the provider breakdown exactly as the API returned it, or null when absent.
 const topProvider = computed(() => {
  const summary = providerAnalytics.value
  if (!summary) return null
  return summary.by_provider[0] ?? null
 })
 async function fetchStories() {
  try {
-    stories.value = await api.get<StoryItem[]>('/api/stories')
+    const [storyList, analytics] = await Promise.all([
      api.get<StoryItem[]>('/api/stories'),
      api.get<GenerationProviderAnalytics>('/api/generations/provider-analytics'),
    ])
    stories.value = storyList
    providerAnalytics.value = analytics
  } catch (e) {
    error.value = e instanceof Error ? e.message : '加载失败'
  } finally {
@@ -81,6 +115,14 @@ function getStoryPath(story: StoryItem) {
  return story.mode === 'storybook' ? `/storybook/view/${story.id}` : `/story/${story.id}`
 }
 /**
  * Format a latency value for display.
  *
  * @param value - Latency in milliseconds; null or undefined when unknown.
  * @returns The value rounded to the nearest integer with an `ms` suffix, or `暂无`
  *   when no finite number is available.
  */
 function formatLatency(value?: number | null): string {
  // `typeof` alone lets NaN/Infinity through, which would render as "NaNms".
  if (typeof value !== 'number' || !Number.isFinite(value)) return '暂无'
  return `${Math.round(value)}ms`
 }
 /**
  * Format an estimated cost for display.
  *
  * @param value - Cost in US dollars; null or undefined when unknown.
  * @returns The cost with a `$` prefix and four decimal places; `$0.0000` when no
  *   finite number is available.
  */
 function formatCost(value?: number | null): string {
  // Non-finite numbers would otherwise print "$NaN" / "$Infinity"; treat them like a missing cost.
  if (typeof value !== 'number' || !Number.isFinite(value)) return '$0.0000'
  return `$${value.toFixed(4)}`
 }
 onMounted(() => {
  fetchStories()
  if (router.currentRoute.value.query.openCreate) {
@@ -160,6 +202,42 @@ onMounted(() => {
        </div>
      </BaseCard>
      <BaseCard
        v-if="providerAnalytics?.total_calls"
        class="mb-8"
        padding="lg"
      >
        <div class="flex flex-col gap-5 lg:flex-row lg:items-center lg:justify-between">
          <div>
            <h2 class="text-xl font-bold text-gray-800">Provider 运营摘要</h2>
            <p class="mt-2 text-sm leading-6 text-gray-500">
              生成、资源补全和失败恢复留下的供应商调用轨迹。
            </p>
          </div>
          <div class="grid grid-cols-2 gap-3 sm:grid-cols-4 lg:min-w-[520px]">
            <div class="rounded-lg border border-gray-100 bg-gray-50 px-3 py-3">
              <div class="text-xs text-gray-500">成功率</div>
              <div class="mt-1 text-lg font-semibold text-gray-800">{{ providerSuccessRate }}%</div>
            </div>
            <div class="rounded-lg border border-gray-100 bg-gray-50 px-3 py-3">
              <div class="text-xs text-gray-500">平均耗时</div>
              <div class="mt-1 text-lg font-semibold text-gray-800">{{ formatLatency(providerAnalytics.avg_latency_ms) }}</div>
            </div>
            <div class="rounded-lg border border-gray-100 bg-gray-50 px-3 py-3">
              <div class="text-xs text-gray-500">预估成本</div>
              <div class="mt-1 text-lg font-semibold text-gray-800">{{ formatCost(providerAnalytics.estimated_cost_usd) }}</div>
            </div>
            <div class="rounded-lg border border-gray-100 bg-gray-50 px-3 py-3">
              <div class="text-xs text-gray-500">调用次数</div>
              <div class="mt-1 text-lg font-semibold text-gray-800">{{ providerAnalytics.total_calls }}</div>
            </div>
          </div>
        </div>
        <p v-if="topProvider" class="mt-4 text-sm text-gray-500">
          当前样本中最前面的能力组合是 {{ topProvider.capability }} / {{ topProvider.adapter }}，成功 {{ topProvider.success_count }} 次，失败 {{ topProvider.failure_count }} 次。
        </p>
      </BaseCard>
      <!-- 故事网格 -->
      <div class="grid grid-cols-1 sm:grid-cols-2 lg:grid-cols-3 gap-6">
        <router-link
--- a/backend/app/api/stories.py
+++ b/backend/app/api/stories.py
@@ -19,6 +19,7 @@ from app.schemas.story_schemas import (
    GenerateRequest,
    GenerationJobDetailResponse,
    GenerationJobSummaryResponse,
    GenerationProviderAnalyticsResponse,
    GenerationProviderStatsResponse,
    GenerationRequest,
    GenerationResponse,
@@ -34,6 +35,7 @@ from app.services import story_service
 from app.services.generation_jobs import (
    get_generation_job_detail,
    get_story_provider_stats,
    get_user_provider_analytics,
    list_story_generation_jobs,
 )
 from app.services.memory_service import build_enhanced_memory_context
@@ -83,6 +85,18 @@ async def get_generation_job(
    return await get_generation_job_detail(db, job_id=job_id, user_id=user.id)
# Literal path: this route takes no story id and reports on the authenticated user only.
@router.get(
    "/generations/provider-analytics",
    response_model=GenerationProviderAnalyticsResponse,
 )
 async def get_generation_provider_analytics(
    user: User = Depends(require_user),
    db: AsyncSession = Depends(get_db),
 ):
    """Get provider call stats aggregated across the user's generation history."""
    # The user id comes from the `require_user` dependency rather than a path or
    # query parameter, so the aggregate is always scoped to the caller.
    return await get_user_provider_analytics(db, user_id=user.id)
@router.get(
    "/generations/{story_id}/jobs",
    response_model=list[GenerationJobSummaryResponse],
--- a/backend/app/schemas/story_schemas.py
+++ b/backend/app/schemas/story_schemas.py
@@ -222,6 +222,19 @@ class GenerationProviderStatsResponse(BaseModel):
    by_provider: list[GenerationProviderStatResponse] = Field(default_factory=list)
 class GenerationProviderAnalyticsResponse(BaseModel):
    """Provider call stats aggregated across one user's generation history."""
    # Sum of successful and failed provider calls.
    total_calls: int
    # Calls counted as successful / failed.
    successful_calls: int
    failed_calls: int
    # Average latency in milliseconds; presumably None when no latency was recorded — confirm.
    avg_latency_ms: float | None = None
    # Estimated total cost in USD (the service rounds it to 6 decimal places).
    estimated_cost_usd: float = 0.0
    # Number of GenerationJob rows owned by the user.
    job_count: int
    # Number of distinct story ids among the user's jobs.
    story_count: int
    # Per capability/adapter breakdown rows.
    by_provider: list[GenerationProviderStatResponse] = Field(default_factory=list)
 class AchievementItem(BaseModel):
    """Achievement item returned for a story."""
--- a/backend/app/services/generation_jobs.py
+++ b/backend/app/services/generation_jobs.py
@@ -5,7 +5,7 @@ from __future__ import annotations
 from typing import Any
 from fastapi import HTTPException
-from sqlalchemy import desc, select
+from sqlalchemy import desc, distinct, func, select
 from sqlalchemy.ext.asyncio import AsyncSession
 from app.db.models import GenerationJob, GenerationJobEvent, Story
@@ -272,28 +272,8 @@ def _as_float(value: Any) -> float | None:
    return None
-async def get_story_provider_stats(
+def _aggregate_provider_events(events: list[GenerationJobEvent]) -> dict[str, Any]:
-    db: AsyncSession,
+    """Aggregate provider telemetry from provider call events."""
    *,
    story_id: int,
    user_id: str,
 ) -> dict[str, Any]:
    """Aggregate provider call telemetry from all user-owned jobs for one story."""
    events = (
        await db.execute(
            select(GenerationJobEvent)
            .join(GenerationJob, GenerationJobEvent.job_id == GenerationJob.id)
            .where(
                GenerationJob.story_id == story_id,
                GenerationJob.user_id == user_id,
                GenerationJobEvent.event_type.in_(
                    ["provider_call_succeeded", "provider_call_failed"]
                ),
            )
            .order_by(GenerationJobEvent.id)
        )
    ).scalars().all()
    by_key: dict[tuple[str, str], dict[str, Any]] = {}
    total_latency = 0.0
@@ -363,7 +343,6 @@ async def get_story_provider_stats(
    )
    return {
        "story_id": story_id,
        "total_calls": successful_calls + failed_calls,
        "successful_calls": successful_calls,
        "failed_calls": failed_calls,
@@ -371,3 +350,66 @@ async def get_story_provider_stats(
        "estimated_cost_usd": round(total_cost, 6),
        "by_provider": by_provider,
    }
 async def get_story_provider_stats(
    db: AsyncSession,
    *,
    story_id: int,
    user_id: str,
 ) -> dict[str, Any]:
    """Summarise provider-call events for one story's jobs owned by ``user_id``.

    Only ``provider_call_succeeded`` / ``provider_call_failed`` events are read,
    in ascending event-id order. The result is the aggregate produced by
    ``_aggregate_provider_events`` with ``story_id`` placed first.
    """
    provider_event_types = ["provider_call_succeeded", "provider_call_failed"]
    statement = (
        select(GenerationJobEvent)
        .join(GenerationJob, GenerationJobEvent.job_id == GenerationJob.id)
        .where(
            GenerationJob.story_id == story_id,
            GenerationJob.user_id == user_id,
            GenerationJobEvent.event_type.in_(provider_event_types),
        )
        .order_by(GenerationJobEvent.id)
    )
    result = await db.execute(statement)
    provider_events = result.scalars().all()
    stats: dict[str, Any] = {"story_id": story_id}
    stats.update(_aggregate_provider_events(provider_events))
    return stats
 async def get_user_provider_analytics(
    db: AsyncSession,
    *,
    user_id: str,
 ) -> dict[str, Any]:
    """Summarise provider-call events across every job owned by ``user_id``.

    Returns the aggregate from ``_aggregate_provider_events`` extended with
    ``job_count`` (all of the user's jobs) and ``story_count`` (distinct story
    ids among those jobs).
    """
    provider_event_types = ["provider_call_succeeded", "provider_call_failed"]
    events_statement = (
        select(GenerationJobEvent)
        .join(GenerationJob, GenerationJobEvent.job_id == GenerationJob.id)
        .where(
            GenerationJob.user_id == user_id,
            GenerationJobEvent.event_type.in_(provider_event_types),
        )
        .order_by(GenerationJobEvent.id)
    )
    provider_events = (await db.execute(events_statement)).scalars().all()
    # The counts cover all of the user's jobs, not only those with provider events.
    counts_statement = select(
        func.count(GenerationJob.id),
        func.count(distinct(GenerationJob.story_id)),
    ).where(GenerationJob.user_id == user_id)
    counts_row = (await db.execute(counts_statement)).one()
    job_count, story_count = counts_row
    analytics = dict(_aggregate_provider_events(provider_events))
    analytics["job_count"] = job_count
    analytics["story_count"] = story_count
    return analytics
--- a/backend/tests/test_generation_jobs.py
+++ b/backend/tests/test_generation_jobs.py
@@ -431,3 +431,123 @@ async def test_story_provider_stats_aggregate_job_events(
        ]
    finally:
        app.dependency_overrides.clear()
 async def test_user_provider_analytics_aggregate_across_stories(
    db_session,
    auth_token,
    degraded_story_with_text,
    test_story,
 ):
    """The analytics endpoint sums provider events from jobs on two different stories.

    Assumes both fixture stories belong to the user behind ``auth_token`` — confirm
    against the fixtures.
    """
    # Route the app's DB dependency to the test session so the API sees the rows below.
    async def override_get_db():
        yield db_session
    app.dependency_overrides[get_db] = override_get_db
    # Story 1: one image job with one successful and one failed provider call.
    image_job = await create_generation_job(
        db_session,
        user_id=degraded_story_with_text.user_id,
        output_mode="asset_retry",
        input_type="image",
        request_payload={"assets": ["image"]},
        story_id=degraded_story_with_text.id,
    )
    await record_generation_event(
        db_session,
        job=image_job,
        story_id=degraded_story_with_text.id,
        event_type="provider_call_succeeded",
        status="succeeded",
        metadata={
            "capability": "image",
            "adapter": "demo",
            "strategy": "priority",
            "latency_ms": 42,
            "estimated_cost_usd": 0.01,
        },
    )
    # The failed call carries no estimated cost, only latency and an error.
    await record_generation_event(
        db_session,
        job=image_job,
        story_id=degraded_story_with_text.id,
        event_type="provider_call_failed",
        status="failed",
        metadata={
            "capability": "image",
            "adapter": "cqtai",
            "strategy": "priority",
            "latency_ms": 120,
            "error": "timeout",
        },
    )
    # Story 2: one audio job with a single successful TTS call.
    audio_job = await create_generation_job(
        db_session,
        user_id=test_story.user_id,
        output_mode="asset_retry",
        input_type="audio",
        request_payload={"assets": ["audio"]},
        story_id=test_story.id,
    )
    await record_generation_event(
        db_session,
        job=audio_job,
        story_id=test_story.id,
        event_type="provider_call_succeeded",
        status="succeeded",
        metadata={
            "capability": "tts",
            "adapter": "edge_tts",
            "strategy": "priority",
            "latency_ms": 18,
            "estimated_cost_usd": 0.003,
        },
    )
    transport = ASGITransport(app=app)
    try:
        async with AsyncClient(transport=transport, base_url="http://test") as client:
            client.cookies.set("access_token", auth_token)
            response = await client.get("/api/generations/provider-analytics")
        assert response.status_code == 200
        data = response.json()
        assert data["job_count"] == 2
        assert data["story_count"] == 2
        assert data["total_calls"] == 3
        assert data["successful_calls"] == 2
        assert data["failed_calls"] == 1
        # (42 + 120 + 18) / 3 == 60
        assert data["avg_latency_ms"] == 60.0
        # 0.01 + 0.003; the failed call contributes no cost.
        assert data["estimated_cost_usd"] == 0.013
        # Expected rows appear ordered by capability, then adapter.
        assert data["by_provider"] == [
            {
                "capability": "image",
                "adapter": "cqtai",
                "call_count": 1,
                "success_count": 0,
                "failure_count": 1,
                "avg_latency_ms": 120.0,
                "estimated_cost_usd": 0.0,
            },
            {
                "capability": "image",
                "adapter": "demo",
                "call_count": 1,
                "success_count": 1,
                "failure_count": 0,
                "avg_latency_ms": 42.0,
                "estimated_cost_usd": 0.01,
            },
            {
                "capability": "tts",
                "adapter": "edge_tts",
                "call_count": 1,
                "success_count": 1,
                "failure_count": 0,
                "avg_latency_ms": 18.0,
                "estimated_cost_usd": 0.003,
            },
        ]
    finally:
        # Always drop the dependency override so later tests get the real get_db.
        app.dependency_overrides.clear()
--- a/docs/planning/demo-checklist.md
+++ b/docs/planning/demo-checklist.md
@@ -56,6 +56,7 @@ SMOKE_AUDIO=1 ./scripts/demo_smoke.sh
 - [ ] 普通故事 provider stats 返回成功率、耗时和成本字段
 - [ ] 普通故事封面 retry 后 `image_status=ready`
 - [ ] 故事详情页能看到生成轨迹和 Provider 调用结果
 - [ ] 故事库能看到跨故事 Provider 运营摘要
 - [ ] `/api/generations` 能生成绘本
 - [ ] 绘本生成响应返回 `generation_job_id`，且 story job history 可查询
 - [ ] 绘本 provider stats 返回成功率、耗时和成本字段
@@ -123,7 +124,7 @@ DreamWeaver 是面向 3-8 岁亲子场景的个性化 AI 绘本与陪伴式讲
 ### 2:20 - 3:00 取舍与下一步
-求职版优先稳定闭环和可解释性，不做支付、多租户和复杂监控。现在 job/event 已能查询 workflow、资产补全、provider 调用轨迹和聚合指标，用户端和管理端也能展示生成轨迹；下一步会迁移到后台 worker 和进度轮询。
+求职版优先稳定闭环和可解释性，不做支付、多租户和复杂监控。现在 job/event 已能查询 workflow、资产补全、provider 调用轨迹和聚合指标，用户端和管理端也能展示生成轨迹与跨故事 Provider 运营摘要；下一步会迁移到后台 worker。
 ---
--- a/docs/planning/demo-validation-log.md
+++ b/docs/planning/demo-validation-log.md
@@ -6,6 +6,10 @@
 补充验证：
 - 新增跨故事 Provider analytics 后，`backend/.venv/bin/python -m pytest backend/tests -q` 通过，83 个测试通过。
 - 用户端与管理端 `npm run build` 均通过；生成轨迹组件已支持未终止任务自动轮询。
 - `docker compose up -d --build` 已再次用当前代码重建本地演示栈。
 - `./scripts/demo_smoke.sh` 再次通过，并新增断言 `GET /api/generations/provider-analytics` 可以返回跨故事总调用、成功率、任务数、故事数和 Provider 明细。
 - 后端新增 `partial_ready`、`text_status` 与迁移 `0012_story_text_status` 后，`backend/.venv/bin/python -m pytest backend/tests -q` 通过，82 个测试通过。
 - `backend/.venv/bin/python -m ruff check backend/app backend/tests backend/alembic/versions/0012_add_story_text_status_and_partial_ready.py` 通过。
 - 用户端与管理端 `npm run build` 均通过。
--- a/docs/product/unified-generation-workflow-prd.md
+++ b/docs/product/unified-generation-workflow-prd.md
@@ -63,6 +63,8 @@ DreamWeaver 当前同时支持普通故事生成、完整故事生成和绘本
 - Provider failover 已记录到 job event，包含 capability、adapter、strategy、latency 和 estimated cost
 - Provider 调用已可按故事聚合为成功率、平均耗时、预估成本和 adapter 明细
 - generation job 响应已提供 `progress_percent`、`progress_label` 和 `is_terminal`，前端可直接用于进度条和轮询
 - 已新增跨故事 Provider 运营摘要 `GET /api/generations/provider-analytics`，故事库可展示总调用、成功率、平均耗时、预估成本和任务/故事覆盖数
 - 用户端与管理端生成轨迹组件会在任务未终止时自动轮询，为后续后台 worker 进度流保留前端形态
 - `POST /api/generations` 响应已返回 `generation_job_id`，smoke 脚本会验证 job 查询与 story job history
 - 用户端与管理端的故事详情页、绘本阅读页已接入生成轨迹，展示生成/重试任务、关键事件、Provider 调用结果和聚合指标
 - 故事详情页封面补全已切换到统一资产重试入口
@@ -72,11 +74,11 @@ DreamWeaver 当前同时支持普通故事生成、完整故事生成和绘本
 - 普通故事、完整生成、绘本生成已有统一外部入口，内部 workflow 仍可继续减少兼容层分支
 - 统一资产重试入口已覆盖普通故事封面、绘本缺失插图和故事音频，后续可继续扩展更细的资产级审计
- 后台异步 worker 进度流、跨故事 Provider 运营分析和断点续跑仍属于后续生产化增强
+- 后台异步 worker 执行、断点续跑、跨时间窗口筛选和更完整的 Provider 运营分析仍属于后续生产化增强
 ### What This Means
-这份 PRD 仍然保留目标态设计，但主干能力已经可在当前代码中演示。当前最适合的继续方式，是继续把同步请求迁移到可复用的后台任务与运营分析视角，而不是继续扩大功能范围。
+这份 PRD 仍然保留目标态设计，但主干能力已经可在当前代码中演示。当前最适合的继续方式，是继续把同步请求迁移到后台 worker，并把当前首版运营摘要扩展为可筛选、可对比的分析视角，而不是继续扩大功能范围。
 ---
@@ -87,7 +89,7 @@ DreamWeaver 当前同时支持普通故事生成、完整故事生成和绘本
 DreamWeaver 当前存在以下工作流层面问题：
 1. **生成入口已建立，内部路径正在收束**
-   当前前端已切到 `/api/generations`，旧的 `/api/stories/generate`、`/api/stories/generate/full`、`/api/storybook/generate` 仍作为兼容入口保留。service 内部已抽取上下文准备、主记录保存、封面补全、绘本插图补全和音频补全 helper，并用 `AssetCompletionResult` 表达资产补全结果。generation job/event 已落库并可查询，Provider 调用轨迹和聚合指标也已进入用户端与管理端展示。下一步重点是为后台异步 worker 与运营成本分析复用这些事件。
+   当前前端已切到 `/api/generations`，旧的 `/api/stories/generate`、`/api/stories/generate/full`、`/api/storybook/generate` 仍作为兼容入口保留。service 内部已抽取上下文准备、主记录保存、封面补全、绘本插图补全和音频补全 helper，并用 `AssetCompletionResult` 表达资产补全结果。generation job/event 已落库并可查询，Provider 调用轨迹、单故事聚合指标和跨故事运营摘要也已进入用户端与管理端展示。下一步重点是为后台异步 worker 复用这些事件。
 2. **保存与资产补全过程正在统一**
   文本故事和绘本已拥有更清晰的主记录保存 helper；普通故事封面、绘本缺失插图、故事音频生成/缓存已共用各自的 asset completion helper。服务层已经能表达资产任务结果，并会把统一入口、资产重试、绘本逐页插图和音频生成的关键节点写入 job event。
--- a/docs/technical/generation-job-state.md
+++ b/docs/technical/generation-job-state.md
@@ -19,8 +19,9 @@
 - `GET /api/generations/jobs/{job_id}`：查询单次生成/补全任务及其事件流。
 - `GET /api/generations/{story_id}/jobs`：查询某个故事或绘本的生成与重试历史。
 - `GET /api/generations/{story_id}/provider-stats`：按故事聚合 Provider 调用成功率、平均耗时、预估成本和 adapter 明细。
 - `GET /api/generations/provider-analytics`：按当前用户聚合跨故事 Provider 调用、任务数、故事数、成功率、平均耗时和预估成本。
-job 响应会返回 `progress_percent`、`progress_label` 和 `is_terminal`，用户端与管理端已经消费这些查询入口，在故事详情页和绘本阅读页展示最近任务、任务历史、事件时间线、进度条和 Provider 聚合指标。
+job 响应会返回 `progress_percent`、`progress_label` 和 `is_terminal`，用户端与管理端已经消费这些查询入口，在故事详情页和绘本阅读页展示最近任务、任务历史、事件时间线、进度条和 Provider 聚合指标；当任务未终止时，前端会自动轮询，为后台 worker 进度流预留体验形态。
 ## 现有状态模型
@@ -50,9 +51,8 @@ job 响应会返回 `progress_percent`、`progress_label` 和 `is_terminal`，
 当前已有两层记录，未来可以继续扩展字段和事件颗粒度：
- 将 job/event 查询继续接入真正异步生成时的进度条。
+- 将同步生成请求迁移到真正异步 worker 后，继续复用现有 job 查询和前端轮询进度条。
- 将当前按故事聚合的 provider 指标扩展为跨用户、跨时间窗口的运营分析。
+- 将当前跨故事 provider 指标扩展为跨时间窗口、跨用户和失败原因维度的运营分析。
 - 将当前同步生成请求迁移到后台 worker 后，复用现有 job 查询接口做轮询进度。
 ## 面试表达
--- a/frontend/src/components/GenerationTrace.vue
+++ b/frontend/src/components/GenerationTrace.vue
@@ -1,5 +1,5 @@
 <script setup lang="ts">
-import { computed, ref, watch } from 'vue'
+import { computed, onBeforeUnmount, ref, watch } from 'vue'
 import { BoltIcon, ClockIcon } from '@heroicons/vue/24/outline'
 import { api } from '../api/client'
 import type {
@@ -29,12 +29,18 @@ const activeJob = ref<GenerationJobDetail | null>(null)
 const providerStats = ref<GenerationProviderStats | null>(null)
 const loading = ref(false)
 const error = ref('')
 let refreshTimer: ReturnType<typeof setInterval> | null = null
 const isDark = computed(() => props.tone === 'dark')
 const latestJob = computed(() => jobHistory.value[0] ?? null)
 const activeJobEvents = computed(() => activeJob.value?.events.slice(-10) ?? [])
 const activeProgress = computed(() => activeJob.value?.progress_percent ?? latestJob.value?.progress_percent ?? 0)
 const activeProgressLabel = computed(() => activeJob.value?.progress_label ?? latestJob.value?.progress_label ?? '暂无进度')
 // Polling is wanted only while the job on display (the selected job, otherwise the
 // newest one in the history) has not reached a terminal state.
 const shouldAutoRefresh = computed(() => {
  const trackedJob = activeJob.value || latestJob.value
  return trackedJob ? !trackedJob.is_terminal : false
 })
 const providerSuccessRate = computed(() => {
  if (!providerStats.value?.total_calls) return null
  return Math.round((providerStats.value.successful_calls / providerStats.value.total_calls) * 100)
@@ -195,6 +201,13 @@ async function refresh() {
  }
 }
 /** Cancel the polling interval, if one is running, and drop its handle. */
 function stopAutoRefresh() {
  if (!refreshTimer) return
  clearInterval(refreshTimer)
  refreshTimer = null
 }
 watch(
  () => props.storyId,
  () => {
@@ -203,6 +216,19 @@ watch(
  { immediate: true },
 )
 // Re-arm polling whenever the auto-refresh condition changes. Any existing timer is
 // cleared first, so at most one interval is active at a time.
 watch(shouldAutoRefresh, (enabled) => {
  stopAutoRefresh()
  if (!enabled) return
  const pollOnce = () => {
    // Skip this tick while the `loading` flag is set.
    if (loading.value) return
    void refresh()
  }
  refreshTimer = setInterval(pollOnce, 2500)
 })
 onBeforeUnmount(stopAutoRefresh)
 defineExpose({ refresh })
 </script>
--- a/frontend/src/types/generation.ts
+++ b/frontend/src/types/generation.ts
@@ -49,3 +49,14 @@ export interface GenerationProviderStats {
  estimated_cost_usd: number
  by_provider: GenerationProviderStat[]
 }
 /** Response shape of `GET /api/generations/provider-analytics` (per-user, cross-story summary). */
 export interface GenerationProviderAnalytics {
  /** Total provider calls included in the summary. */
  total_calls: number
  /** Calls counted as successful. */
  successful_calls: number
  /** Calls counted as failed. */
  failed_calls: number
  /** Average latency in milliseconds; null is presumably "no latency samples" — confirm with the backend. */
  avg_latency_ms: number | null
  /** Estimated total cost in US dollars. */
  estimated_cost_usd: number
  /** Number of generation jobs counted for the user. */
  job_count: number
  /** Number of distinct stories counted for the user. */
  story_count: number
  /** Per capability/adapter rows, in the order returned by the API. */
  by_provider: GenerationProviderStat[]
 }
--- a/frontend/src/views/MyStories.vue
+++ b/frontend/src/views/MyStories.vue
@@ -7,6 +7,7 @@ import BaseButton from '../components/ui/BaseButton.vue'
 import BaseCard from '../components/ui/BaseCard.vue'
 import EmptyState from '../components/ui/EmptyState.vue'
 import LoadingSpinner from '../components/ui/LoadingSpinner.vue'
 import type { GenerationProviderAnalytics } from '../types/generation'
 import {
  getAssetStatusMeta,
  getGenerationStatusMeta,
@@ -37,6 +38,7 @@ interface StoryItem {
 const router = useRouter()
 const stories = ref<StoryItem[]>([])
 const providerAnalytics = ref<GenerationProviderAnalytics | null>(null)
 const loading = ref(true)
 const error = ref('')
 const showCreateModal = ref(false)
@@ -48,10 +50,22 @@ const readableCount = computed(() =>
 const attentionCount = computed(() =>
  stories.value.filter((story) => needsGenerationAttention(story.generation_status)).length,
 )
 // Whole-number success percentage, or null when there is no analytics payload or no calls.
 const providerSuccessRate = computed(() => {
  const summary = providerAnalytics.value
  if (!summary || !summary.total_calls) return null
  const ratio = summary.successful_calls / summary.total_calls
  return Math.round(ratio * 100)
 })
 // First row of the provider breakdown exactly as the API returned it, or null when absent.
 const topProvider = computed(() => {
  const summary = providerAnalytics.value
  if (!summary) return null
  return summary.by_provider[0] ?? null
 })
 async function fetchStories() {
  try {
-    stories.value = await api.get<StoryItem[]>('/api/stories')
+    const [storyList, analytics] = await Promise.all([
      api.get<StoryItem[]>('/api/stories'),
      api.get<GenerationProviderAnalytics>('/api/generations/provider-analytics'),
    ])
    stories.value = storyList
    providerAnalytics.value = analytics
  } catch (e) {
    error.value = e instanceof Error ? e.message : '加载失败'
  } finally {
@@ -84,6 +98,14 @@ function getStoryLink(story: StoryItem) {
  return story.mode === 'storybook' ? `/storybook/view/${story.id}` : `/story/${story.id}`
 }
 /**
  * Format a latency value for display.
  *
  * @param value - Latency in milliseconds; null or undefined when unknown.
  * @returns The value rounded to the nearest integer with an `ms` suffix, or `暂无`
  *   when no finite number is available.
  */
 function formatLatency(value?: number | null): string {
  // `typeof` alone lets NaN/Infinity through, which would render as "NaNms".
  if (typeof value !== 'number' || !Number.isFinite(value)) return '暂无'
  return `${Math.round(value)}ms`
 }
 /**
  * Format an estimated cost for display.
  *
  * @param value - Cost in US dollars; null or undefined when unknown.
  * @returns The cost with a `$` prefix and four decimal places; `$0.0000` when no
  *   finite number is available.
  */
 function formatCost(value?: number | null): string {
  // Non-finite numbers would otherwise print "$NaN" / "$Infinity"; treat them like a missing cost.
  if (typeof value !== 'number' || !Number.isFinite(value)) return '$0.0000'
  return `$${value.toFixed(4)}`
 }
 onMounted(() => {
  void fetchStories()
@@ -158,6 +180,42 @@ onMounted(() => {
        </div>
      </BaseCard>
      <BaseCard
        v-if="providerAnalytics?.total_calls"
        class="mb-8"
        padding="lg"
      >
        <div class="flex flex-col gap-5 lg:flex-row lg:items-center lg:justify-between">
          <div>
            <h2 class="text-xl font-bold text-gray-800">Provider 运营摘要</h2>
            <p class="mt-2 text-sm leading-6 text-gray-500">
              历次生成和资源补全留下的供应商调用轨迹。
            </p>
          </div>
          <div class="grid grid-cols-2 gap-3 sm:grid-cols-4 lg:min-w-[520px]">
            <div class="rounded-lg border border-gray-100 bg-gray-50 px-3 py-3">
              <div class="text-xs text-gray-500">成功率</div>
              <div class="mt-1 text-lg font-semibold text-gray-800">{{ providerSuccessRate }}%</div>
            </div>
            <div class="rounded-lg border border-gray-100 bg-gray-50 px-3 py-3">
              <div class="text-xs text-gray-500">平均耗时</div>
              <div class="mt-1 text-lg font-semibold text-gray-800">{{ formatLatency(providerAnalytics.avg_latency_ms) }}</div>
            </div>
            <div class="rounded-lg border border-gray-100 bg-gray-50 px-3 py-3">
              <div class="text-xs text-gray-500">预估成本</div>
              <div class="mt-1 text-lg font-semibold text-gray-800">{{ formatCost(providerAnalytics.estimated_cost_usd) }}</div>
            </div>
            <div class="rounded-lg border border-gray-100 bg-gray-50 px-3 py-3">
              <div class="text-xs text-gray-500">调用次数</div>
              <div class="mt-1 text-lg font-semibold text-gray-800">{{ providerAnalytics.total_calls }}</div>
            </div>
          </div>
        </div>
        <p v-if="topProvider" class="mt-4 text-sm text-gray-500">
          当前样本中最前面的能力组合是 {{ topProvider.capability }} / {{ topProvider.adapter }}，成功 {{ topProvider.success_count }} 次，失败 {{ topProvider.failure_count }} 次。
        </p>
      </BaseCard>
      <div class="grid grid-cols-1 sm:grid-cols-2 lg:grid-cols-3 gap-6">
        <router-link
          v-for="story in stories"
--- a/scripts/demo_smoke.sh
+++ b/scripts/demo_smoke.sh
@@ -153,6 +153,11 @@ assert_jq "$storybook_jobs_json" 'length >= 2 and (map(.id) | index("'"$storyboo
 echo "$story_jobs_json" | jq '[.[] | {id,output_mode,status,current_step}]'
 echo "$storybook_jobs_json" | jq '[.[] | {id,output_mode,status,current_step}]'
 # Cross-story analytics: fetch the per-user summary and check its minimum totals.
 say "Checking cross-story provider analytics"
 provider_analytics_json="$(get_json "$APP_URL/api/generations/provider-analytics")"
 # NOTE(review): the thresholds (>= 2 calls, >= 4 jobs, >= 2 stories) presumably mirror the
 # story and storybook jobs created earlier in this script — confirm if those steps change.
 assert_jq "$provider_analytics_json" '.total_calls >= 2 and .successful_calls >= 2 and .job_count >= 4 and .story_count >= 2 and (.by_provider | length) >= 1' "provider analytics should summarize calls across generated stories"
 # Print the headline numbers for the smoke log.
 echo "$provider_analytics_json" | jq '{total_calls,successful_calls,failed_calls,job_count,story_count,avg_latency_ms,estimated_cost_usd}'
 say "Checking story list"
 list_json="$(get_json "$APP_URL/api/stories?limit=5")"
 assert_jq "$list_json" "map(.id) | index($story_id) != null" "story list should include generated story"