api/routers/transcribe/sessions.py
Kevin Carter 36ae76143f Phase 3B: Implement pluggable LLM client for summary generation
- Create llm_client.py with 5 provider implementations (Anthropic, OpenAI, Ollama, OpenRouter, Google)
- Add build_prompt() helper to construct system/user prompts from templates
- Wire up POST /transcribe/sessions/{id}/summaries endpoint to call LLM client
- Return generated content + token counts (input_tokens, output_tokens)
- API keys passed per-request, never stored or logged
- Uses prompt templates from prompts.py based on summary_type
2026-05-20 22:20:19 +00:00

356 lines
13 KiB
Python

"""Transcription sessions router — CRUD endpoints for transcription sessions and segments."""
from fastapi import APIRouter, Depends, HTTPException, Query
from typing import Optional, List
from datetime import datetime
from modules.auth.supabase_bearer import SupabaseBearer
from modules.transcription.models import (
TranscriptionSessionCreate,
TranscriptionSessionUpdate,
TranscriptionSessionResponse,
SessionListResponse,
TranscriptionSegmentCreate,
TranscriptionSegmentResponse,
SummaryGenerateRequest,
SummaryResponse,
ExportFormat,
)
from modules.transcription.llm_client import call_llm, build_prompt
import logging
# Module-level logger, named after this module.
logger = logging.getLogger(__name__)
# Router on which every endpoint in this module is registered.
router = APIRouter()
def get_supabase_client():
    """Create and return a Supabase service-role client.

    The client class is imported lazily, when this function is called,
    rather than at module import time.
    """
    from modules.database.supabase.utils.client import SupabaseServiceRoleClient

    service_client = SupabaseServiceRoleClient()
    return service_client
def get_user_id(credentials=Depends(SupabaseBearer())) -> str:
    """Extract the caller's user id from the decoded Supabase JWT payload.

    The ``sub`` claim is preferred, with ``user_id`` as a fallback.

    Raises:
        HTTPException: 401 when the payload carries neither claim. The
            endpoints in this module filter rows by this value, so an empty
            id must never be passed through.
    """
    user_id = credentials.get("sub") or credentials.get("user_id")
    if not user_id:
        raise HTTPException(
            status_code=401,
            detail="Authenticated user id missing from token",
        )
    return user_id
@router.post("/sessions", response_model=TranscriptionSessionResponse)
async def create_session(
    session_data: TranscriptionSessionCreate,
    user_id: str = Depends(get_user_id),
):
    """Insert a new transcription session owned by the authenticated user.

    Only ``title`` and ``canvas_type`` are taken from the request body; the
    owner is always the caller's ``user_id``.

    Returns:
        The first row returned by the insert.

    Raises:
        HTTPException: 500 when the insert returns no rows.
    """
    client = get_supabase_client()
    new_row = dict(
        user_id=user_id,
        title=session_data.title,
        canvas_type=session_data.canvas_type,
    )
    inserted = client.supabase.table("transcription_sessions").insert(new_row).execute()
    if inserted.data:
        return inserted.data[0]
    raise HTTPException(status_code=500, detail="Failed to create session")
@router.patch("/sessions/{session_id}", response_model=TranscriptionSessionResponse)
async def update_session(
    session_id: str,
    update_data: TranscriptionSessionUpdate,
    user_id: str = Depends(get_user_id),
):
    """Update a transcription session (end, tag, title).

    Only fields whose value is not ``None`` are written; ``updated_at`` is
    always refreshed.

    Returns:
        The first row returned by the update.

    Raises:
        HTTPException: 404 when no session with this id belongs to the
            caller; 500 when the update returns no rows.
    """
    from datetime import timezone

    supabase = get_supabase_client()

    # Verify ownership before touching the row.
    existing = (
        supabase.supabase.table("transcription_sessions")
        .select("id")
        .eq("id", session_id)
        .eq("user_id", user_id)
        .execute()
    )
    if not existing.data:
        raise HTTPException(status_code=404, detail="Session not found")

    # mode="json" turns values such as datetimes into JSON-safe primitives
    # before they reach the HTTP client; None-valued fields are skipped so a
    # partial update does not null out columns.
    updates = {
        field: value
        for field, value in update_data.model_dump(mode="json").items()
        if value is not None
    }
    # Timezone-aware replacement for the deprecated datetime.utcnow().
    updates["updated_at"] = datetime.now(timezone.utc).isoformat()

    # The client uses the service role, so the owner filter is repeated on
    # the write itself instead of relying only on the check above.
    result = (
        supabase.supabase.table("transcription_sessions")
        .update(updates)
        .eq("id", session_id)
        .eq("user_id", user_id)
        .execute()
    )
    if not result.data:
        raise HTTPException(status_code=500, detail="Failed to update session")
    return result.data[0]
@router.get("/sessions", response_model=SessionListResponse)
async def list_sessions(
    user_id: str = Depends(get_user_id),
    page: int = Query(1, ge=1),
    page_size: int = Query(20, ge=1, le=100),
    timetable_period_id: Optional[str] = None,
):
    """Return one page of the caller's transcription sessions, newest first.

    Args:
        page: 1-based page number.
        page_size: Rows per page (1-100).
        timetable_period_id: When given, only sessions with this
            ``timetable_period_id`` are returned.

    Returns:
        A ``SessionListResponse`` with the page rows and the exact total
        count reported by the query (0 when no count is reported).
    """
    # NOTE(review): rows soft-deleted by delete_session (metadata.deleted)
    # are not filtered out here - confirm whether that is intended.
    client = get_supabase_client()

    first_row = (page - 1) * page_size
    last_row = first_row + page_size - 1  # range() bounds are inclusive

    sessions_query = (
        client.supabase.table("transcription_sessions")
        .select("*", count="exact")
        .eq("user_id", user_id)
    )
    if timetable_period_id:
        sessions_query = sessions_query.eq("timetable_period_id", timetable_period_id)

    page_result = (
        sessions_query.order("started_at", desc=True)
        .range(first_row, last_row)
        .execute()
    )
    total_rows = page_result.count or 0
    return SessionListResponse(
        sessions=page_result.data,
        total=total_rows,
        page=page,
        page_size=page_size,
    )
@router.get("/sessions/{session_id}", response_model=dict)
async def get_session(
    session_id: str,
    user_id: str = Depends(get_user_id),
):
    """Fetch one session together with its segments and summaries.

    Returns:
        A dict with keys ``session`` (the session row), ``segments`` (ordered
        by ``sequence_index``) and ``summaries``.

    Raises:
        HTTPException: 404 when no session with this id belongs to the caller.
    """
    client = get_supabase_client()

    # The session lookup doubles as the ownership check.
    owned_session = (
        client.supabase.table("transcription_sessions")
        .select("*")
        .eq("id", session_id)
        .eq("user_id", user_id)
        .execute()
    )
    if not owned_session.data:
        raise HTTPException(status_code=404, detail="Session not found")

    segment_rows = (
        client.supabase.table("transcription_segments")
        .select("*")
        .eq("session_id", session_id)
        .order("sequence_index")
        .execute()
    )
    summary_rows = (
        client.supabase.table("transcription_summaries")
        .select("*")
        .eq("session_id", session_id)
        .execute()
    )

    payload = {
        "session": owned_session.data[0],
        "segments": segment_rows.data,
        "summaries": summary_rows.data,
    }
    return payload
@router.delete("/sessions/{session_id}")
async def delete_session(
    session_id: str,
    user_id: str = Depends(get_user_id),
):
    """Soft delete a transcription session.

    The row is kept: ``ended_at`` is set to the current UTC time and a
    ``deleted`` flag is added to the session's ``metadata``. Existing
    metadata keys are preserved.

    Returns:
        ``{"message": "Session deleted"}``.

    Raises:
        HTTPException: 404 when no session with this id belongs to the caller.
    """
    from datetime import timezone

    supabase = get_supabase_client()

    # Verify ownership; the row is also needed to merge its metadata.
    existing = (
        supabase.supabase.table("transcription_sessions")
        .select("*")
        .eq("id", session_id)
        .eq("user_id", user_id)
        .execute()
    )
    if not existing.data:
        raise HTTPException(status_code=404, detail="Session not found")

    # Merge rather than replace, so flagging the row as deleted does not wipe
    # whatever else is stored in the metadata column.
    current_metadata = existing.data[0].get("metadata")
    if isinstance(current_metadata, dict):
        merged_metadata = {**current_metadata, "deleted": True}
    else:
        merged_metadata = {"deleted": True}

    # The client uses the service role, so the owner filter is repeated on
    # the write itself.
    supabase.supabase.table("transcription_sessions").update({
        "ended_at": datetime.now(timezone.utc).isoformat(),
        "metadata": merged_metadata,
    }).eq("id", session_id).eq("user_id", user_id).execute()

    return {"message": "Session deleted"}
@router.post("/sessions/{session_id}/segments")
async def upsert_segments(
    session_id: str,
    segments: List[TranscriptionSegmentCreate],
    user_id: str = Depends(get_user_id),
):
    """Batch-store segments for a session and refresh its segment count.

    NOTE(review): despite the name, rows are written with ``insert``; a true
    upsert needs a conflict target that is not visible from this module.

    Returns:
        A dict with a human-readable ``message`` and the ``count`` of
        segments written by this request.

    Raises:
        HTTPException: 404 when no session with this id belongs to the caller.
    """
    supabase = get_supabase_client()

    # Verify session exists and user owns it.
    session_check = (
        supabase.supabase.table("transcription_sessions")
        .select("id")
        .eq("id", session_id)
        .eq("user_id", user_id)
        .execute()
    )
    if not session_check.data:
        raise HTTPException(status_code=404, detail="Session not found")

    # Pin every row to the session that was just authorised, so a body that
    # carries its own session_id cannot write into a different session.
    # mode="json" keeps the payload JSON-serialisable.
    segment_data = [
        {**segment.model_dump(mode="json"), "session_id": session_id}
        for segment in segments
    ]
    if segment_data:
        supabase.supabase.table("transcription_segments").insert(segment_data).execute()

    # Store the session's total number of segments, not the size of this
    # batch: later batches must not shrink the count, and an empty batch must
    # not reset it to zero. limit(1) avoids pulling the rows back; the exact
    # count is reported independently of the limit.
    count_result = (
        supabase.supabase.table("transcription_segments")
        .select("session_id", count="exact")
        .eq("session_id", session_id)
        .limit(1)
        .execute()
    )
    if count_result.count is not None:
        supabase.supabase.table("transcription_sessions").update({
            "segment_count": count_result.count,
        }).eq("id", session_id).execute()

    return {"message": f"Upserted {len(segment_data)} segments", "count": len(segment_data)}
@router.get("/sessions/{session_id}/segments", response_model=List[TranscriptionSegmentResponse])
async def list_segments(
    session_id: str,
    user_id: str = Depends(get_user_id),
):
    """Return every segment of a session, ordered by ``sequence_index``.

    Raises:
        HTTPException: 404 when no session with this id belongs to the caller.
    """
    client = get_supabase_client()

    # Ownership gate: the session must exist and belong to the caller.
    owner_lookup = (
        client.supabase.table("transcription_sessions")
        .select("id")
        .eq("id", session_id)
        .eq("user_id", user_id)
        .execute()
    )
    if not owner_lookup.data:
        raise HTTPException(status_code=404, detail="Session not found")

    ordered_segments = (
        client.supabase.table("transcription_segments")
        .select("*")
        .eq("session_id", session_id)
        .order("sequence_index")
        .execute()
    )
    return ordered_segments.data
def _redact_secret(message: str, secret) -> str:
    """Return *message* with every occurrence of *secret* masked out."""
    if secret:
        return message.replace(str(secret), "[REDACTED]")
    return message


@router.post("/sessions/{session_id}/summaries", response_model=SummaryResponse)
async def generate_summary(
    session_id: str,
    summary_request: SummaryGenerateRequest,
    user_id: str = Depends(get_user_id),
):
    """Generate a summary for a session using the specified LLM provider.

    Builds a transcript from the session's segments (optionally restricted
    to ``segment_range``), renders the prompt for ``summary_type``, calls the
    pluggable LLM client and stores the result. The API key is passed
    per-request and never stored or logged.

    Returns:
        The stored summary row.

    Raises:
        HTTPException: 404 when no session with this id belongs to the
            caller; 400 when the session has no segments or the selected
            transcript is empty; 502 when the LLM call fails; 500 when the
            summary cannot be saved.
    """
    supabase = get_supabase_client()

    # Verify session exists and user owns it.
    session_check = (
        supabase.supabase.table("transcription_sessions")
        .select("id")
        .eq("id", session_id)
        .eq("user_id", user_id)
        .execute()
    )
    if not session_check.data:
        raise HTTPException(status_code=404, detail="Session not found")

    segments_result = (
        supabase.supabase.table("transcription_segments")
        .select("*")
        .eq("session_id", session_id)
        .order("sequence_index")
        .execute()
    )
    if not segments_result.data:
        raise HTTPException(status_code=400, detail="No segments found for this session")

    # Parse the optional range once; it is used both for slicing and storage.
    segments = segments_result.data
    seg_start = None
    seg_end = None
    segment_range = summary_request.segment_range
    if segment_range and len(segment_range) == 2:
        seg_start, seg_end = segment_range
        # A None bound means "open-ended", which is what slicing does with it.
        # NOTE(review): bounds are list positions with an exclusive end, not
        # sequence_index values - confirm this matches what clients send.
        segments = segments[seg_start:seg_end]

    # Build full transcript text from segments, skipping empty ones.
    transcript = "\n".join(s["text"] for s in segments if s.get("text"))
    if not transcript.strip():
        raise HTTPException(status_code=400, detail="Transcript is empty — cannot generate summary")

    # Build prompt from template.
    system_prompt, user_message = build_prompt(summary_request.summary_type, transcript)

    try:
        llm_result = await call_llm(
            provider=summary_request.provider,
            model=summary_request.model,
            api_key=summary_request.api_key,
            system_prompt=system_prompt,
            user_message=user_message,
        )
    except Exception as e:
        # Provider/HTTP errors can echo the request (URL, headers), so the
        # key is masked before the text is logged or returned to the client.
        safe_error = _redact_secret(str(e), summary_request.api_key)
        logger.error("LLM call failed: %s", safe_error)
        # "from None": do not attach the unredacted exception as the cause.
        raise HTTPException(
            status_code=502,
            detail=f"LLM generation failed: {safe_error}",
        ) from None

    # Build the prompt that was used (for audit trail).
    if summary_request.summary_type != "segment":
        prompt_used = f"{system_prompt}\n\n{user_message}"
    else:
        prompt_used = user_message

    # Save summary to database.
    summary_data = {
        "session_id": session_id,
        "user_id": user_id,
        "summary_type": summary_request.summary_type,
        "content": llm_result.content,
        "prompt_used": prompt_used,
        "llm_provider": summary_request.provider,
        "llm_model": summary_request.model,
        "input_tokens": llm_result.input_tokens,
        "output_tokens": llm_result.output_tokens,
        "segment_range_start": seg_start,
        "segment_range_end": seg_end,
    }
    result = supabase.supabase.table("transcription_summaries").insert(summary_data).execute()
    if not result.data:
        raise HTTPException(status_code=500, detail="Failed to save summary")
    return result.data[0]
@router.get("/sessions/{session_id}/summaries", response_model=List[SummaryResponse])
async def list_summaries(
    session_id: str,
    user_id: str = Depends(get_user_id),
):
    """Return all stored summaries of a session.

    Raises:
        HTTPException: 404 when no session with this id belongs to the caller.
    """
    client = get_supabase_client()

    # Ownership gate: the session must exist and belong to the caller.
    owner_lookup = (
        client.supabase.table("transcription_sessions")
        .select("id")
        .eq("id", session_id)
        .eq("user_id", user_id)
        .execute()
    )
    if not owner_lookup.data:
        raise HTTPException(status_code=404, detail="Session not found")

    summary_rows = (
        client.supabase.table("transcription_summaries")
        .select("*")
        .eq("session_id", session_id)
        .execute()
    )
    return summary_rows.data
@router.post("/sessions/{session_id}/export")
async def export_session(
    session_id: str,
    export_format: ExportFormat,
    user_id: str = Depends(get_user_id),
):
    """Export a session's segments as SRT, TXT, or JSON.

    SRT is still a stub that returns a placeholder string. TXT joins the
    segment texts with newlines. JSON returns the raw segment rows.

    Returns:
        A dict with the chosen ``format`` and its ``content``.

    Raises:
        HTTPException: 404 when no session with this id belongs to the
            caller; 400 for an unsupported format.
    """
    supabase = get_supabase_client()

    # Verify ownership.
    session_check = (
        supabase.supabase.table("transcription_sessions")
        .select("id")
        .eq("id", session_id)
        .eq("user_id", user_id)
        .execute()
    )
    if not session_check.data:
        raise HTTPException(status_code=404, detail="Session not found")

    segments_result = (
        supabase.supabase.table("transcription_segments")
        .select("*")
        .eq("session_id", session_id)
        .order("sequence_index")
        .execute()
    )
    segments = segments_result.data

    if export_format.format == "srt":
        # Phase 1 stub — implement in Phase 3
        return {"format": "srt", "content": "[TODO: Generate SRT from segments]"}
    if export_format.format == "txt":
        # A segment with a missing or null text becomes an empty line rather
        # than crashing the whole export.
        text = "\n".join(s.get("text") or "" for s in segments)
        return {"format": "txt", "content": text}
    if export_format.format == "json":
        return {"format": "json", "content": {"segments": segments}}
    raise HTTPException(status_code=400, detail=f"Unsupported format: {export_format.format}")