# leaudit-platform-backend/fastapi_modules/fastapi_leaudit/rag_engine/question_chains.py

from __future__ import annotations

import json
import re

import httpx

from fastapi_modules.fastapi_leaudit.rag_engine.config import RAG_CONFIG, build_openai_chat_completions_url


# Maximum number of follow-up questions handed back to the caller.
_MAX_FOLLOWUPS = 3

# First "[" through last "]" in the reply; used to pull a JSON array out of
# Markdown code fences or surrounding prose.
_JSON_ARRAY_RE = re.compile(r"\[.*\]", re.DOTALL)

# Leading list marker such as "- ", "* ", "1. ", "2) " or "3、". The lookahead
# keeps decimals like "3.5" intact at the start of a question.
_LIST_MARKER_RE = re.compile(r"^\s*(?:[-*•]+|\d+[.)、．:：](?!\d))\s*")


def _parse_followups(content: object, limit: int = _MAX_FOLLOWUPS) -> list[str]:
    """Extract up to *limit* follow-up questions from raw model output.

    A JSON array is preferred (either the whole reply or the first bracketed
    span inside it); otherwise every non-empty line is treated as one
    question after its list marker is removed.

    Args:
        content: The ``content`` field of the chat completion message. Any
            non-string or blank value yields an empty list.
        limit: Maximum number of questions to return.

    Returns:
        A list of stripped, non-empty question strings.
    """
    if not isinstance(content, str):
        return []
    text = content.strip()
    if not text:
        return []

    # Try the reply verbatim first, then the embedded "[...]" span, so that
    # fenced or prose-wrapped JSON is still recognised.
    candidates = [text]
    embedded = _JSON_ARRAY_RE.search(text)
    if embedded is not None and embedded.group(0) != text:
        candidates.append(embedded.group(0))

    for candidate in candidates:
        try:
            parsed = json.loads(candidate)
        except json.JSONDecodeError:
            continue
        if isinstance(parsed, list):
            questions = (str(item).strip() for item in parsed)
            return [question for question in questions if question][:limit]

    # Line-based fallback: strip only the *leading* list marker so digits and
    # periods that belong to the question itself are preserved.
    followups: list[str] = []
    for line in text.splitlines():
        if line.lstrip().startswith("```"):
            continue  # Markdown fence delimiters are never questions.
        cleaned = _LIST_MARKER_RE.sub("", line, count=1).strip()
        if cleaned:
            followups.append(cleaned)
    return followups[:limit]


async def generate_followups(query: str, answer: str) -> list[str]:
    """Ask the configured LLM for short follow-up questions.

    Sends a single chat-completion request containing the user's question and
    the first 1200 characters of the answer, then parses the reply into a
    list of questions.

    Args:
        query: The user's original question.
        answer: The answer already produced for *query*.

    Returns:
        At most three follow-up questions; an empty list when the model
        returns no usable text.

    Raises:
        httpx.HTTPStatusError: If the endpoint answers with an error status.
        KeyError, IndexError: If the response body lacks
            ``choices[0].message.content``.
    """
    # Real newlines (not a literal backslash-n) separate the instruction, the
    # question and the answer in the prompt.
    prompt = (
        "基于用户问题和已有回答，生成 3 个适合继续追问的简短问题。"
        "仅返回 JSON 数组字符串，例如 [\"问题1\", \"问题2\"]。\n"
        f"用户问题: {query}\n回答: {answer[:1200]}"
    )
    async with httpx.AsyncClient(timeout=30.0) as client:
        resp = await client.post(
            build_openai_chat_completions_url(RAG_CONFIG["LLM_BASE_URL"]),
            json={
                "model": RAG_CONFIG["LLM_MODEL"],
                "messages": [{"role": "user", "content": prompt}],
                "temperature": 0.5,
                "max_tokens": 256,
                # NOTE(review): presumably a serving-backend option that turns
                # off the model's reasoning output — confirm with the backend.
                "chat_template_kwargs": {"enable_thinking": False},
            },
            headers={
                "Content-Type": "application/json",
                "Authorization": f"Bearer {RAG_CONFIG['LLM_API_KEY']}",
            },
        )
        resp.raise_for_status()
        content = resp.json()["choices"][0]["message"]["content"]
    return _parse_followups(content)