125 lines
3.8 KiB
Python
125 lines
3.8 KiB
Python
from __future__ import annotations
|
|
|
|
import base64
|
|
import json
|
|
import os
|
|
from pathlib import Path
|
|
from typing import Any
|
|
|
|
import httpx
|
|
from dotenv import load_dotenv
|
|
|
|
from helpers import summarize_error
|
|
|
|
# Runs at import time, before any request helper reads OPENROUTER_API_KEY via
# _api_key(). NOTE(review): presumably this loads a local .env file into the
# process environment (python-dotenv) — confirm against the deployment setup.
load_dotenv()
|
|
|
|
# Root URL of the OpenRouter HTTP API; transcribe() and summarize() append
# their endpoint paths ("/audio/transcriptions", "/chat/completions") to it.
OPENROUTER_BASE = "https://openrouter.ai/api/v1"
|
|
|
|
|
|
def _api_key() -> str:
|
|
return os.getenv("OPENROUTER_API_KEY", "")
|
|
|
|
|
|
def _auth_headers() -> dict[str, str]:
    """Build the bearer-token header dict used for OpenRouter requests.

    A new dict is created on every call, so callers may add further headers
    to the result without affecting later calls.

    Returns:
        A dict holding only the ``Authorization`` header.

    Raises:
        ValueError: If ``_api_key()`` returns an empty value.
    """
    token = _api_key()
    if token:
        return {"Authorization": f"Bearer {token}"}
    raise ValueError("OPENROUTER_API_KEY not set")
|
|
|
|
|
|
def _audio_format(audio_path: str) -> str:
|
|
suffix = Path(audio_path).suffix.lower().lstrip(".")
|
|
return suffix or "wav"
|
|
|
|
|
|
def _build_transcription_payload(audio_path: str) -> dict[str, Any]:
    """Assemble the request body for a transcription call.

    The file at *audio_path* is read in binary mode in one go, base64-encoded
    to ASCII text, and placed under ``input_audio`` together with the format
    string returned by ``_audio_format``.

    Returns:
        A dict with the ``model`` name and the ``input_audio`` mapping
        (``data`` and ``format``).

    Raises:
        OSError: If the file cannot be opened or read.
    """
    with open(audio_path, "rb") as handle:
        raw_bytes = handle.read()

    audio_blob = {
        "data": base64.b64encode(raw_bytes).decode("ascii"),
        "format": _audio_format(audio_path),
    }
    return {"model": "openai/whisper-large-v3", "input_audio": audio_blob}
|
|
|
|
|
|
async def transcribe(audio_path: str) -> str:
    """Send audio to OpenRouter's whisper model and return transcript text.

    Args:
        audio_path: Path of the audio file to transcribe. The whole file is
            read and sent base64-encoded inside a JSON request body.

    Returns:
        The transcript with surrounding whitespace removed.

    Raises:
        ValueError: If no API key is configured (raised by ``_auth_headers``).
        OSError: If the audio file cannot be read.
        RuntimeError: If OpenRouter answers with an error status, with a body
            that is not a JSON object, or with a missing, non-string or blank
            ``text`` field.
    """
    headers = _auth_headers()
    headers["Content-Type"] = "application/json"

    # Build the body first so an unreadable file fails before an HTTP client
    # is opened.
    payload = json.dumps(_build_transcription_payload(audio_path))

    async with httpx.AsyncClient(timeout=300) as client:
        resp = await client.post(
            f"{OPENROUTER_BASE}/audio/transcriptions",
            headers=headers,
            content=payload,
        )

    try:
        resp.raise_for_status()
    except httpx.HTTPStatusError as exc:
        detail = summarize_error(_safe_json(resp), fallback=resp.text)
        raise RuntimeError(f"OpenRouter transcription failed: {detail}") from exc

    # A success status does not guarantee a JSON object body; _safe_json gives
    # None for an unparseable body, so every malformed response is reported as
    # RuntimeError instead of leaking JSONDecodeError or AttributeError.
    data = _safe_json(resp)
    if not isinstance(data, dict):
        raise RuntimeError("Unexpected OpenRouter transcription response shape")

    text = data.get("text", "")
    if not isinstance(text, str) or not text.strip():
        raise RuntimeError("OpenRouter transcription returned empty text")
    return text.strip()
|
|
|
|
|
|
async def summarize(transcript: str) -> str:
    """Send transcript to DeepSeek via OpenRouter and return structured meeting summary.

    Args:
        transcript: Meeting transcript text. Only its first 16000 characters
            are embedded in the prompt.

    Returns:
        The model's summary text with surrounding whitespace removed.

    Raises:
        ValueError: If no API key is configured (raised by ``_auth_headers``).
        RuntimeError: If OpenRouter answers with an error status, with a body
            that is not JSON or lacks ``choices[0].message.content``, or with
            non-string or blank content.
    """
    # The slice bounds how much transcript is sent; longer input is silently
    # truncated (presumably to keep the prompt size in check).
    prompt = f"""You are a meeting summarizer. Given the following meeting transcript, produce a concise, well-structured summary with:

1. **Overview** — 2-3 sentences covering what was discussed
2. **Key Decisions** — decisions that were made
3. **Action Items** — who needs to do what (use bullet points)
4. **Next Steps / Deadlines** — any dates, timelines, or follow-ups mentioned

If speaker labels are present, preserve them where helpful in action items.

Transcript:
{transcript[:16000]}"""

    body = {
        "model": "@preset/cheap-deepseek-v4-flash",
        "messages": [{"role": "user", "content": prompt}],
        "max_tokens": 1500,
    }

    headers = _auth_headers()
    headers["Content-Type"] = "application/json"

    async with httpx.AsyncClient(timeout=180) as client:
        resp = await client.post(
            f"{OPENROUTER_BASE}/chat/completions",
            headers=headers,
            json=body,
        )

    try:
        resp.raise_for_status()
    except httpx.HTTPStatusError as exc:
        detail = summarize_error(_safe_json(resp), fallback=resp.text)
        raise RuntimeError(f"OpenRouter summarization failed: {detail}") from exc

    # _safe_json returns None for a body that is not valid JSON; subscripting
    # None raises TypeError, so that case is reported through the same
    # "unexpected shape" error instead of leaking a JSON decode error.
    data = _safe_json(resp)
    try:
        content = data["choices"][0]["message"]["content"]
    except (KeyError, IndexError, TypeError) as exc:
        raise RuntimeError("Unexpected OpenRouter summarization response shape") from exc

    if not isinstance(content, str) or not content.strip():
        raise RuntimeError("OpenRouter summarization returned empty content")
    return content.strip()
|
|
|
|
|
|
def _safe_json(resp: httpx.Response) -> Any:
|
|
try:
|
|
return resp.json()
|
|
except Exception:
|
|
return None
|