from typing import Any, Dict, List from fastapi import APIRouter, Depends from sqlalchemy.orm import Session from app.core.config import settings from app.core.security import get_current_user from app.db.session import get_db from app.models.knowledge import Document, KnowledgeBase from app.models.user import User from app.schemas.testing import TestingPipelineRequest, TestingPipelineResponse from app.services.embedding.embedding_factory import EmbeddingsFactory from app.services.retrieval.multi_kb_retriever import MultiKBRetriever, format_retrieval_context from app.services.testing_pipeline import run_testing_pipeline from app.services.vector_store import VectorStoreFactory router = APIRouter() async def _build_kb_vector_stores(db: Session, knowledge_bases: List[KnowledgeBase]) -> List[Dict[str, Any]]: embeddings = EmbeddingsFactory.create() kb_vector_stores: List[Dict[str, Any]] = [] for kb in knowledge_bases: documents = db.query(Document).filter(Document.knowledge_base_id == kb.id).all() if not documents: continue store = VectorStoreFactory.create( store_type=settings.VECTOR_STORE_TYPE, collection_name=f"kb_{kb.id}", embedding_function=embeddings, ) kb_vector_stores.append({"kb_id": kb.id, "store": store}) return kb_vector_stores @router.post("/generate", response_model=TestingPipelineResponse) async def generate_testing_content( *, payload: TestingPipelineRequest, current_user: User = Depends(get_current_user), db: Session = Depends(get_db), ) -> Any: _ = current_user knowledge_context = (payload.knowledge_context or "").strip() if payload.knowledge_base_ids: knowledge_bases = ( db.query(KnowledgeBase) .filter( KnowledgeBase.id.in_(payload.knowledge_base_ids), KnowledgeBase.user_id == current_user.id, ) .all() ) kb_vector_stores = await _build_kb_vector_stores(db, knowledge_bases) if kb_vector_stores: retriever = MultiKBRetriever( reranker_weight=settings.RERANKER_WEIGHT, ) retrieval_rows = await retriever.retrieve( query=payload.requirement_text, kb_vector_stores=kb_vector_stores, fetch_k_per_kb=max(12, payload.retrieval_top_k * 2), top_k=payload.retrieval_top_k, ) if retrieval_rows: knowledge_context = format_retrieval_context(retrieval_rows) result = run_testing_pipeline( user_requirement_text=payload.requirement_text, requirement_type_input=payload.requirement_type, debug=payload.debug, knowledge_context=knowledge_context, use_model_generation=payload.use_model_generation, max_items_per_group=payload.max_items_per_group, cases_per_item=payload.cases_per_item, max_focus_points=payload.max_focus_points, max_llm_calls=payload.max_llm_calls, ) return result