126 lines
4.5 KiB
Python
126 lines
4.5 KiB
Python
import logging
|
|
import asyncio
|
|
from typing import Any, Dict, List
|
|
|
|
from fastapi import APIRouter, Depends, HTTPException
|
|
from sqlalchemy.orm import Session
|
|
|
|
from app.core.config import settings
|
|
from app.core.security import get_current_user
|
|
from app.db.session import get_db
|
|
from app.models.knowledge import Document, KnowledgeBase
|
|
from app.models.user import User
|
|
from app.schemas.testing import TestingPipelineRequest, TestingPipelineResponse
|
|
from app.services.embedding.embedding_factory import EmbeddingsFactory
|
|
from app.services.retrieval.multi_kb_retriever import MultiKBRetriever, format_retrieval_context
|
|
from app.services.testing_pipeline import run_testing_pipeline
|
|
from app.services.vector_store import VectorStoreFactory
|
|
|
|
router = APIRouter()
|
|
logger = logging.getLogger(__name__)
|
|
MODEL_PIPELINE_TIMEOUT_SECONDS = 300
|
|
|
|
|
|
async def _build_kb_vector_stores(db: Session, knowledge_bases: List[KnowledgeBase]) -> List[Dict[str, Any]]:
|
|
embeddings = EmbeddingsFactory.create()
|
|
kb_vector_stores: List[Dict[str, Any]] = []
|
|
|
|
for kb in knowledge_bases:
|
|
documents = db.query(Document).filter(Document.knowledge_base_id == kb.id).all()
|
|
if not documents:
|
|
continue
|
|
|
|
store = VectorStoreFactory.create(
|
|
store_type=settings.VECTOR_STORE_TYPE,
|
|
collection_name=f"kb_{kb.id}",
|
|
embedding_function=embeddings,
|
|
)
|
|
kb_vector_stores.append({"kb_id": kb.id, "store": store})
|
|
|
|
return kb_vector_stores
|
|
|
|
|
|
@router.post("/generate", response_model=TestingPipelineResponse)
|
|
async def generate_testing_content(
|
|
*,
|
|
payload: TestingPipelineRequest,
|
|
current_user: User = Depends(get_current_user),
|
|
db: Session = Depends(get_db),
|
|
) -> Any:
|
|
_ = current_user
|
|
|
|
knowledge_context = (payload.knowledge_context or "").strip()
|
|
if payload.knowledge_base_ids:
|
|
try:
|
|
knowledge_bases = (
|
|
db.query(KnowledgeBase)
|
|
.filter(
|
|
KnowledgeBase.id.in_(payload.knowledge_base_ids),
|
|
KnowledgeBase.user_id == current_user.id,
|
|
)
|
|
.all()
|
|
)
|
|
|
|
kb_vector_stores = await _build_kb_vector_stores(db, knowledge_bases)
|
|
if kb_vector_stores:
|
|
retriever = MultiKBRetriever(
|
|
reranker_weight=settings.RERANKER_WEIGHT,
|
|
)
|
|
retrieval_rows = await retriever.retrieve(
|
|
query=payload.requirement_text,
|
|
kb_vector_stores=kb_vector_stores,
|
|
fetch_k_per_kb=max(12, payload.retrieval_top_k * 2),
|
|
top_k=payload.retrieval_top_k,
|
|
)
|
|
if retrieval_rows:
|
|
knowledge_context = format_retrieval_context(retrieval_rows)
|
|
except Exception as exc:
|
|
logger.exception(
|
|
"Testing generation retrieval fallback triggered for user=%s knowledge_base_ids=%s: %s",
|
|
current_user.id,
|
|
payload.knowledge_base_ids,
|
|
exc,
|
|
)
|
|
|
|
pipeline_kwargs = {
|
|
"user_requirement_text": payload.requirement_text,
|
|
"requirement_type_input": payload.requirement_type,
|
|
"debug": payload.debug,
|
|
"knowledge_context": knowledge_context,
|
|
"use_model_generation": payload.use_model_generation,
|
|
"max_items_per_group": payload.max_items_per_group,
|
|
"cases_per_item": payload.cases_per_item,
|
|
"max_focus_points": payload.max_focus_points,
|
|
"max_llm_calls": payload.max_llm_calls,
|
|
}
|
|
|
|
try:
|
|
result = await asyncio.wait_for(
|
|
asyncio.to_thread(run_testing_pipeline, **pipeline_kwargs),
|
|
timeout=MODEL_PIPELINE_TIMEOUT_SECONDS,
|
|
)
|
|
except asyncio.TimeoutError as exc:
|
|
logger.exception(
|
|
"Testing pipeline timed out for user=%s use_model_generation=%s after %s seconds",
|
|
current_user.id,
|
|
payload.use_model_generation,
|
|
MODEL_PIPELINE_TIMEOUT_SECONDS,
|
|
)
|
|
raise HTTPException(
|
|
status_code=504,
|
|
detail=f"LLM generation timed out after {MODEL_PIPELINE_TIMEOUT_SECONDS} seconds",
|
|
) from exc
|
|
except Exception as exc:
|
|
logger.exception(
|
|
"Testing pipeline failed for user=%s use_model_generation=%s: %s",
|
|
current_user.id,
|
|
payload.use_model_generation,
|
|
exc,
|
|
)
|
|
raise HTTPException(
|
|
status_code=500,
|
|
detail=f"LLM generation failed: {exc}",
|
|
) from exc
|
|
|
|
return result
|