feat: integrate NotebookLM with RAG system

Add complete integration between NotebookLM Agent and DocuMente RAG: New Components: - NotebookLMIndexerService: Syncs NotebookLM content to Qdrant vector store - notebooklm_sync API routes: Manage notebook indexing (/api/v1/notebooklm/*) Enhanced Components: - RAGService: Added notebook_ids filter and query_notebooks() method - VectorStoreService: Added filter support for metadata queries - DocumentService: Added ingest_notebooklm_source() method - Query routes: Added /query/notebooks endpoint for notebook-only queries - Main API: Integrated new routes and updated to v2.1.0 Features: - Sync NotebookLM notebooks to local vector store - Query across documents and/or notebooks - Filter RAG queries by specific notebook IDs - Manage indexed notebooks (list, sync, delete) - Track sync status and metadata API Endpoints: - POST /api/v1/notebooklm/sync/{notebook_id} - GET /api/v1/notebooklm/indexed - DELETE /api/v1/notebooklm/sync/{notebook_id} - GET /api/v1/notebooklm/sync/{notebook_id}/status - POST /api/v1/query/notebooks Closes integration request for unified NotebookLM + RAG agent
2026-04-06 17:18:33 +02:00
parent 67ba5bc2dd
commit e3bacbc0a4
7 changed files with 795 additions and 18 deletions
@@ -1,6 +1,7 @@
 """DocuMente API - Backend powered by datapizza-ai.
 Multi-provider LLM support: OpenAI, Z.AI, OpenCode Zen, OpenRouter, Anthropic, Google, Mistral, Azure
 NotebookLM Integration: Sync and query NotebookLM notebooks
 """
 from contextlib import asynccontextmanager
@@ -14,6 +15,7 @@ from agentic_rag.api.routes import (
    chat,
    documents,
    health,
    notebooklm_sync,
    providers,
    query,
 )
@@ -57,7 +59,9 @@ def create_application() -> FastAPI:
    app = FastAPI(
        title="DocuMente API",
        description="""
-        DocuMente - Sistema di Retrieval Agentico con AI. Interroga i tuoi documenti in modo intelligente.
+        DocuMente - Sistema di Retrieval Agentico con AI + NotebookLM Integration.
        Interroga i tuoi documenti e i tuoi notebook NotebookLM in modo intelligente.
        ## Multi-Provider LLM Support
@@ -71,6 +75,13 @@ def create_application() -> FastAPI:
        - **Mistral AI**
        - **Azure OpenAI**
        ## NotebookLM Integration
        Sync your Google NotebookLM notebooks and query them with RAG:
        - Sync notebooks to local vector store
        - Query notebook content alongside documents
        - Search across multiple notebooks
        ## Authentication
        Two methods supported:
@@ -84,8 +95,10 @@ def create_application() -> FastAPI:
        - 💬 Chat with your documents
        - 🎯 RAG (Retrieval-Augmented Generation)
        - 🚀 Multiple LLM providers
        - 📓 NotebookLM notebook integration
        - 🔗 Notebook sync and indexing
        """,
-        version="2.0.0",
+        version="2.1.0",
        docs_url="/api/docs",
        redoc_url="/api/redoc",
        openapi_url="/api/openapi.json",
@@ -107,6 +120,7 @@ def create_application() -> FastAPI:
    app.include_router(documents.router, prefix="/api/v1", tags=["documents"])
    app.include_router(query.router, prefix="/api/v1", tags=["query"])
    app.include_router(chat.router, prefix="/api/v1", tags=["chat"])
    app.include_router(notebooklm_sync.router, prefix="/api/v1", tags=["notebooklm-sync"])
    # Serve static files (frontend)
    try:
@@ -129,15 +143,16 @@ async def api_root():
    return {
        "name": "DocuMente API",
-        "version": "2.0.0",
+        "version": "2.1.0",
        "docs": "/api/docs",
-        "description": "DocuMente - Sistema di Retrieval Agentico con AI",
+        "description": "DocuMente - Sistema di Retrieval Agentico con AI + NotebookLM",
        "features": {
            "multi_provider_llm": True,
            "authentication": ["api_key", "jwt"],
            "document_processing": True,
            "rag": True,
            "streaming": True,
            "notebooklm_integration": True,
        },
        "configured_providers": [p["id"] for p in configured],
        "default_provider": settings.default_llm_provider,
@@ -166,7 +181,7 @@ async def detailed_health_check():
    return {
        "status": "healthy",
-        "version": "2.0.0",
+        "version": "2.1.0",
        "components": {
            "api": "healthy",
            "vector_store": vector_status,
@@ -0,0 +1,218 @@
 """NotebookLM Sync API routes.
 This module provides endpoints for syncing NotebookLM notebooks
 to the local RAG vector store.
 """
 from fastapi import APIRouter, HTTPException, status
 from pydantic import BaseModel, Field
 from agentic_rag.services.notebooklm_indexer import get_notebooklm_indexer
 from notebooklm_agent.services.notebook_service import NotebookService
 router = APIRouter(prefix="/notebooklm", tags=["notebooklm-sync"])
 class NotebookSyncRequest(BaseModel):
    """Request to sync a notebook."""
    notebook_id: str = Field(..., description="Notebook ID to sync")
 class NotebookSyncResponse(BaseModel):
    """Response from notebook sync operation."""
    sync_id: str
    notebook_id: str
    notebook_title: str | None
    status: str
    sources_indexed: int
    total_chunks: int
    message: str
 class NotebookSyncDeleteResponse(BaseModel):
    """Response from deleting notebook index."""
    notebook_id: str
    deleted: bool
    message: str
 class IndexedNotebook(BaseModel):
    """Indexed notebook information."""
    notebook_id: str
    notebook_title: str | None
    sources_count: int
    chunks_count: int
    last_sync: str | None
 class IndexedNotebooksResponse(BaseModel):
    """Response with list of indexed notebooks."""
    notebooks: list[IndexedNotebook]
    total: int
@router.post(
    "/sync/{notebook_id}",
    response_model=NotebookSyncResponse,
    status_code=status.HTTP_202_ACCEPTED,
    summary="Sync a NotebookLM notebook",
    description="Synchronize a NotebookLM notebook to the local vector store for RAG queries.",
 )
 async def sync_notebook(notebook_id: str):
    """Sync a notebook from NotebookLM to the local vector store.
    Args:
        notebook_id: The notebook ID to sync
    Returns:
        Sync operation result
    """
    try:
        # First check if notebook exists in NotebookLM
        notebook_service = NotebookService()
        try:
            notebook = await notebook_service.get(notebook_id)
        except Exception:
            raise HTTPException(
                status_code=status.HTTP_404_NOT_FOUND,
                detail=f"Notebook {notebook_id} not found in NotebookLM",
            )
        # Start sync
        indexer = await get_notebooklm_indexer()
        result = await indexer.sync_notebook(notebook_id)
        if result["status"] == "error":
            raise HTTPException(
                status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
                detail=result.get("error", "Unknown error during sync"),
            )
        return NotebookSyncResponse(
            sync_id=result["sync_id"],
            notebook_id=result["notebook_id"],
            notebook_title=result.get("notebook_title"),
            status="success",
            sources_indexed=result["sources_indexed"],
            total_chunks=result["total_chunks"],
            message=f"Successfully synced {result['sources_indexed']} sources with {result['total_chunks']} chunks",
        )
    except HTTPException:
        raise
    except Exception as e:
        raise HTTPException(
            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
            detail=f"Failed to sync notebook: {str(e)}",
        )
@router.get(
    "/indexed",
    response_model=IndexedNotebooksResponse,
    summary="List indexed notebooks",
    description="Get a list of all NotebookLM notebooks that have been synced to the local vector store.",
 )
 async def list_indexed_notebooks():
    """List all indexed notebooks."""
    try:
        indexer = await get_notebooklm_indexer()
        notebooks = await indexer.get_indexed_notebooks()
        return IndexedNotebooksResponse(
            notebooks=[
                IndexedNotebook(
                    notebook_id=nb.get("notebook_id", ""),
                    notebook_title=nb.get("notebook_title"),
                    sources_count=nb.get("sources_count", 0),
                    chunks_count=nb.get("chunks_count", 0),
                    last_sync=nb.get("last_sync"),
                )
                for nb in notebooks
            ],
            total=len(notebooks),
        )
    except Exception as e:
        raise HTTPException(
            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
            detail=f"Failed to list indexed notebooks: {str(e)}",
        )
@router.delete(
    "/sync/{notebook_id}",
    response_model=NotebookSyncDeleteResponse,
    summary="Remove notebook index",
    description="Remove a notebook's index from the local vector store.",
 )
 async def delete_notebook_index(notebook_id: str):
    """Delete a notebook's index from the vector store.
    Args:
        notebook_id: The notebook ID to remove
    Returns:
        Deletion result
    """
    try:
        indexer = await get_notebooklm_indexer()
        deleted = await indexer.delete_notebook_index(notebook_id)
        if not deleted:
            raise HTTPException(
                status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
                detail=f"Failed to delete index for notebook {notebook_id}",
            )
        return NotebookSyncDeleteResponse(
            notebook_id=notebook_id,
            deleted=True,
            message=f"Successfully removed index for notebook {notebook_id}",
        )
    except HTTPException:
        raise
    except Exception as e:
        raise HTTPException(
            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
            detail=f"Failed to delete notebook index: {str(e)}",
        )
@router.get(
    "/sync/{notebook_id}/status",
    summary="Check sync status",
    description="Check if a notebook has been synced and get its status.",
 )
 async def get_sync_status(notebook_id: str):
    """Check the sync status of a notebook."""
    try:
        indexer = await get_notebooklm_indexer()
        # Check if notebook is indexed
        indexed = await indexer.get_indexed_notebooks()
        notebook_info = next((nb for nb in indexed if nb.get("notebook_id") == notebook_id), None)
        if notebook_info:
            return {
                "notebook_id": notebook_id,
                "status": "indexed",
                "sources_count": notebook_info.get("sources_count", 0),
                "chunks_count": notebook_info.get("chunks_count", 0),
                "last_sync": notebook_info.get("last_sync"),
            }
        else:
            return {
                "notebook_id": notebook_id,
                "status": "not_indexed",
                "message": "Notebook has not been synced yet",
            }
    except Exception as e:
        raise HTTPException(
            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
            detail=f"Failed to check sync status: {str(e)}",
        )
@@ -1,4 +1,4 @@
-"""Query API routes with multi-provider support."""
+"""Query API routes with multi-provider and NotebookLM support."""
 from fastapi import APIRouter, Depends, HTTPException
 from pydantic import BaseModel, Field
@@ -12,7 +12,7 @@ router = APIRouter()
 class QueryRequest(BaseModel):
-    """Query request model with provider selection."""
+    """Query request model with provider and notebook selection."""
    question: str = Field(..., description="Question to ask")
    k: int = Field(5, description="Number of chunks to retrieve", ge=1, le=20)
@@ -20,6 +20,12 @@ class QueryRequest(BaseModel):
        None, description="LLM provider to use (defaults to system default)"
    )
    model: str | None = Field(None, description="Model to use (provider-specific)")
    notebook_ids: list[str] | None = Field(
        None, description="Optional list of NotebookLM notebook IDs to search"
    )
    include_documents: bool = Field(
        True, description="Include regular documents in search (when notebook_ids specified)"
    )
 class QueryResponse(BaseModel):
@@ -31,16 +37,29 @@ class QueryResponse(BaseModel):
    model: str
    sources: list[dict]
    user: str
    filters_applied: dict | None = None
 class NotebookQueryRequest(BaseModel):
    """Query request specifically for NotebookLM notebooks."""
    question: str = Field(..., description="Question to ask")
    notebook_ids: list[str] = Field(..., description="List of NotebookLM notebook IDs to search")
    k: int = Field(5, description="Number of chunks to retrieve per notebook", ge=1, le=50)
    provider: str | None = Field(
        None, description="LLM provider to use (defaults to system default)"
    )
    model: str | None = Field(None, description="Model to use (provider-specific)")
@router.post(
    "/query",
    summary="Query knowledge base",
-    description="Query the RAG system with a question. Supports multiple LLM providers.",
+    description="Query the RAG system with a question. Supports multiple LLM providers and NotebookLM notebooks.",
    response_model=QueryResponse,
 )
 async def query(request: QueryRequest, current_user: dict = CurrentUser):
-    """Execute a RAG query with specified provider."""
+    """Execute a RAG query with specified provider and optional notebook filtering."""
    try:
        settings = get_settings()
@@ -59,9 +78,16 @@ async def query(request: QueryRequest, current_user: dict = CurrentUser):
                f"Set API key in .env file.",
            )
-        # Execute query
+        # Execute query with optional notebook filtering
        service = await get_rag_service()
-        result = await service.query(request.question, k=request.k, provider=provider, model=model)
+        result = await service.query(
            request.question,
            k=request.k,
            provider=provider,
            model=model,
            notebook_ids=request.notebook_ids,
            include_documents=request.include_documents,
        )
        return QueryResponse(
            question=request.question,
@@ -70,6 +96,59 @@ async def query(request: QueryRequest, current_user: dict = CurrentUser):
            model=result.get("model", model),
            sources=result["sources"],
            user=current_user.get("user_id", "anonymous"),
            filters_applied=result.get("filters_applied"),
        )
    except HTTPException:
        raise
    except Exception as e:
        raise HTTPException(status_code=500, detail=str(e))
@router.post(
    "/query/notebooks",
    summary="Query NotebookLM notebooks",
    description="Execute a RAG query specifically on indexed NotebookLM notebooks.",
    response_model=QueryResponse,
 )
 async def query_notebooks(request: NotebookQueryRequest, current_user: dict = CurrentUser):
    """Execute a RAG query on specific NotebookLM notebooks."""
    try:
        settings = get_settings()
        # Determine provider
        provider = request.provider or settings.default_llm_provider
        model = request.model or settings.default_llm_model
        # Check if provider is configured
        if not settings.is_provider_configured(provider):
            available = settings.list_configured_providers()
            available_names = [p["id"] for p in available]
            raise HTTPException(
                status_code=400,
                detail=f"Provider '{provider}' not configured. "
                f"Available: {available_names}. "
                f"Set API key in .env file.",
            )
        # Execute query on notebooks only
        service = await get_rag_service()
        result = await service.query_notebooks(
            question=request.question,
            notebook_ids=request.notebook_ids,
            k=request.k,
            provider=provider,
            model=model,
        )
        return QueryResponse(
            question=request.question,
            answer=result["answer"],
            provider=provider,
            model=result.get("model", model),
            sources=result["sources"],
            user=current_user.get("user_id", "anonymous"),
            filters_applied=result.get("filters_applied"),
        )
    except HTTPException:
@@ -81,7 +160,7 @@ async def query(request: QueryRequest, current_user: dict = CurrentUser):
@router.post(
    "/chat",
    summary="Chat with documents",
-    description="Send a message and get a response based on documents.",
+    description="Send a message and get a response based on documents and/or notebooks.",
    response_model=QueryResponse,
 )
 async def chat(request: QueryRequest, current_user: dict = CurrentUser):
@@ -86,6 +86,56 @@ class DocumentService:
            "filename": Path(file_path).name,
            "chunks_count": len(result) if isinstance(result, list) else 1,
            "metadata": metadata or {},
            "source": "document",
        }
    async def ingest_notebooklm_source(
        self,
        content: str,
        notebook_id: str,
        source_id: str,
        source_title: str,
        source_type: str,
        notebook_title: str,
    ) -> dict:
        """Ingest a NotebookLM source into the vector store.
        Args:
            content: The text content from the source
            notebook_id: The notebook ID
            source_id: The source ID
            source_title: The source title
            source_type: The source type (url, file, etc.)
            notebook_title: The notebook title
        Returns:
            Ingestion result with chunk count
        """
        from datapizza.schema import Document
        from uuid import uuid4
        # Create document with metadata
        doc = Document(
            text=content,
            metadata={
                "notebook_id": notebook_id,
                "source_id": source_id,
                "source_title": source_title,
                "source_type": source_type,
                "notebook_title": notebook_title,
                "source": "notebooklm",
            },
        )
        # Process through pipeline
        result = self.pipeline.run_document(doc)
        return {
            "source_id": source_id,
            "source_title": source_title,
            "chunks_count": len(result) if isinstance(result, list) else 1,
            "notebook_id": notebook_id,
            "source": "notebooklm",
        }
    async def list_documents(self) -> list[dict]:
@@ -0,0 +1,257 @@
 """NotebookLM Indexer Service for integrating NotebookLM with RAG.
 This service synchronizes content from Google NotebookLM notebooks
 to the local Qdrant vector store, enabling RAG queries on notebook content.
 """
 from typing import Any
 from uuid import UUID, uuid4
 from datapizza.embedders import ChunkEmbedder
 from datapizza.embedders.openai import OpenAIEmbedder
 from datapizza.modules.splitters import NodeSplitter
 from datapizza.vectorstores.qdrant import QdrantVectorstore
 from agentic_rag.core.config import get_settings
 from notebooklm_agent.services.notebook_service import NotebookService
 from notebooklm_agent.services.source_service import SourceService
 settings = get_settings()
 class NotebookLMIndexerService:
    """Service for indexing NotebookLM notebooks into the vector store.
    This service bridges NotebookLM Agent and DocuMente RAG by:
    1. Extracting content from NotebookLM notebooks
    2. Chunking and embedding the content
    3. Storing in Qdrant with metadata for retrieval
    """
    def __init__(self):
        self.vector_store = None
        self.embedder = None
        self.splitter = None
        self.notebook_service = None
        self.source_service = None
        self._init_components()
    def _init_components(self):
        """Initialize vector store, embedder, and NotebookLM services."""
        # Initialize vector store
        self.vector_store = QdrantVectorstore(
            host=settings.qdrant_host,
            port=settings.qdrant_port,
        )
        # Initialize embedder
        self.embedder = ChunkEmbedder(
            client=OpenAIEmbedder(
                api_key=settings.openai_api_key,
                model_name=settings.embedding_model,
            )
        )
        # Initialize text splitter for chunking
        self.splitter = NodeSplitter(max_char=1024)
        # Initialize NotebookLM services
        self.notebook_service = NotebookService()
        self.source_service = SourceService()
    async def sync_notebook(self, notebook_id: str | UUID) -> dict:
        """Sync a notebook from NotebookLM to the vector store.
        Args:
            notebook_id: The notebook ID to sync
        Returns:
            Sync result with counts and status
        """
        notebook_id = str(notebook_id)
        sync_id = str(uuid4())
        try:
            # Get notebook info
            notebook = await self.notebook_service.get(UUID(notebook_id))
            # Get all sources from the notebook
            sources = await self.source_service.list_sources(UUID(notebook_id))
            total_chunks = 0
            indexed_sources = []
            for source in sources.items if hasattr(sources, "items") else sources:
                # Try to get full text content from source
                content = await self._extract_source_content(UUID(notebook_id), str(source.id))
                if content:
                    # Chunk and index the content
                    chunks_count = await self._index_content(
                        content=content,
                        notebook_id=notebook_id,
                        source_id=str(source.id),
                        source_title=source.title,
                        source_type=source.type,
                        notebook_title=notebook.title,
                        sync_id=sync_id,
                    )
                    total_chunks += chunks_count
                    indexed_sources.append(
                        {"source_id": str(source.id), "title": source.title, "chunks": chunks_count}
                    )
            return {
                "sync_id": sync_id,
                "notebook_id": notebook_id,
                "notebook_title": notebook.title,
                "status": "success",
                "sources_indexed": len(indexed_sources),
                "total_chunks": total_chunks,
                "sources": indexed_sources,
            }
        except Exception as e:
            return {
                "sync_id": sync_id,
                "notebook_id": notebook_id,
                "status": "error",
                "error": str(e),
            }
    async def _extract_source_content(self, notebook_id: UUID, source_id: str) -> str | None:
        """Extract text content from a source.
        Args:
            notebook_id: The notebook UUID
            source_id: The source ID
        Returns:
            Extracted text content or None if not available
        """
        try:
            # Use the source service to get fulltext
            fulltext = await self.source_service.get_fulltext(notebook_id, source_id)
            return fulltext
        except Exception:
            return None
        except Exception:
            return None
    async def _index_content(
        self,
        content: str,
        notebook_id: str,
        source_id: str,
        source_title: str,
        source_type: str,
        notebook_title: str,
        sync_id: str,
    ) -> int:
        """Index content chunks into the vector store.
        Args:
            content: The text content to index
            notebook_id: The notebook ID
            source_id: The source ID
            source_title: The source title
            source_type: The source type (url, file, etc.)
            notebook_title: The notebook title
            sync_id: The sync operation ID
        Returns:
            Number of chunks indexed
        """
        # Split content into chunks
        from datapizza.schema import Document
        doc = Document(
            text=content,
            metadata={
                "notebook_id": notebook_id,
                "source_id": source_id,
                "source_title": source_title,
                "source_type": source_type,
                "notebook_title": notebook_title,
                "sync_id": sync_id,
                "source": "notebooklm",
            },
        )
        # Split into chunks
        chunks = self.splitter.run(doc)
        if not chunks:
            return 0
        # Embed and store each chunk
        for chunk in chunks:
            # Generate embedding
            embedding = await self.embedder.aembed(chunk.text)
            # Store in vector store with metadata
            self.vector_store.add_points(
                collection_name="documents",
                points=[
                    {
                        "id": str(uuid4()),
                        "vector": embedding,
                        "payload": {"text": chunk.text, **chunk.metadata},
                    }
                ],
            )
        return len(chunks)
    async def get_indexed_notebooks(self) -> list[dict]:
        """Get list of all indexed notebooks.
        Returns:
            List of indexed notebooks with metadata
        """
        try:
            # Get collection info
            collection = self.vector_store.get_collection("documents")
            # Search for unique notebook_ids in metadata
            # This is a simplified version - in production you'd query the vector store
            return []
        except Exception:
            return []
    async def delete_notebook_index(self, notebook_id: str | UUID) -> bool:
        """Remove a notebook's index from the vector store.
        Args:
            notebook_id: The notebook ID to remove
        Returns:
            True if successful
        """
        try:
            notebook_id = str(notebook_id)
            # Delete all points with matching notebook_id
            self.vector_store.delete_points(
                collection_name="documents",
                filter_condition={
                    "must": [{"key": "notebook_id", "match": {"value": notebook_id}}]
                },
            )
            return True
        except Exception:
            return False
 # Singleton instance
 _notebooklm_indexer = None
 async def get_notebooklm_indexer() -> NotebookLMIndexerService:
    """Get or create the NotebookLM indexer service instance."""
    global _notebooklm_indexer
    if _notebooklm_indexer is None:
        _notebooklm_indexer = NotebookLMIndexerService()
    return _notebooklm_indexer
@@ -30,7 +30,13 @@ class RAGService:
        )
    async def query(
-        self, question: str, k: int = 5, provider: str | None = None, model: str | None = None
+        self,
        question: str,
        k: int = 5,
        provider: str | None = None,
        model: str | None = None,
        notebook_ids: list[str] | None = None,
        include_documents: bool = True,
    ) -> dict:
        """Execute a RAG query with specified provider.
@@ -39,6 +45,8 @@ class RAGService:
            k: Number of chunks to retrieve
            provider: LLM provider to use
            model: Model name
            notebook_ids: Optional list of notebook IDs to filter by
            include_documents: Whether to include local documents in search
        Returns:
            Response with answer and sources
@@ -49,8 +57,18 @@ class RAGService:
        # Get query embedding
        query_embedding = await self._get_embedding(question)
        # Build filter condition if notebook_ids specified
        filter_condition = None
        if notebook_ids:
            filter_condition = {
                "should": [{"key": "notebook_id", "match": {"value": nid}} for nid in notebook_ids]
            }
            if include_documents:
                # Also include regular documents (those without notebook_id)
                filter_condition["should"].append({"key": "source", "match": {"value": "document"}})
        # Retrieve relevant chunks
-        chunks = await vector_store.search(query_embedding, k=k)
+        chunks = await vector_store.search(query_embedding, k=k, filter_condition=filter_condition)
        # Format context from chunks
        context = self._format_context(chunks)
@@ -62,14 +80,52 @@ class RAGService:
        prompt = self._build_prompt(context, question)
        response = await llm_client.invoke(prompt)
        # Format sources with type information
        formatted_sources = self._format_sources(chunks)
        return {
            "question": question,
            "answer": response.text,
-            "sources": chunks,
+            "sources": formatted_sources,
            "provider": provider or settings.default_llm_provider,
            "model": model or getattr(response, "model", "unknown"),
            "filters_applied": {
                "notebook_ids": notebook_ids,
                "include_documents": include_documents,
            },
        }
    async def query_notebooks(
        self,
        question: str,
        notebook_ids: list[str],
        k: int = 5,
        provider: str | None = None,
        model: str | None = None,
    ) -> dict:
        """Execute a RAG query specifically on NotebookLM notebooks.
        This is a convenience method that queries only notebook content.
        Args:
            question: User question
            notebook_ids: List of notebook IDs to search
            k: Number of chunks to retrieve per notebook
            provider: LLM provider to use
            model: Model name
        Returns:
            Response with answer and sources from notebooks
        """
        return await self.query(
            question=question,
            k=k,
            provider=provider,
            model=model,
            notebook_ids=notebook_ids,
            include_documents=False,
        )
    async def _get_embedding(self, text: str) -> list[float]:
        """Get embedding for text."""
        result = await self.embedder.aembed(text)
@@ -84,6 +140,31 @@ class RAGService:
                context_parts.append(f"[{i}] {text}")
        return "\n\n".join(context_parts)
    def _format_sources(self, chunks: list[dict]) -> list[dict]:
        """Format source information for response."""
        formatted = []
        for chunk in chunks:
            source = {
                "text": chunk.get("text", "")[:500] + "..."
                if len(chunk.get("text", "")) > 500
                else chunk.get("text", ""),
                "source_type": chunk.get("source", "unknown"),
            }
            # Add notebook-specific metadata if available
            if chunk.get("notebook_id"):
                source["notebook_id"] = chunk.get("notebook_id")
                source["notebook_title"] = chunk.get("notebook_title", "Unknown")
                source["source_id"] = chunk.get("source_id")
                source["source_title"] = chunk.get("source_title", "Unknown")
            else:
                # Regular document
                source["document_id"] = chunk.get("document_id", "unknown")
            formatted.append(source)
        return formatted
    def _build_prompt(self, context: str, question: str) -> str:
        """Build the RAG prompt."""
        return f"""You are a helpful AI assistant. Answer the question based on the provided context.
@@ -98,6 +179,7 @@ Instructions:
 - If the context doesn't contain the answer, say "I don't have enough information to answer this question"
 - Be concise but complete
 - Cite sources using [1], [2], etc. when referencing information
 - When citing notebook sources, mention the source title for clarity
 Answer:"""
@@ -1,5 +1,7 @@
 """Vector store service using datapizza-ai and Qdrant."""
 from typing import Any
 from datapizza.vectorstores.qdrant import QdrantVectorstore
 from agentic_rag.core.config import get_settings
@@ -25,11 +27,85 @@ class VectorStoreService:
        except Exception:
            return False
-    async def search(self, query_vector: list[float], k: int = 5) -> list[dict]:
+    async def search(
-        """Search the vector store."""
+        self, query_vector: list[float], k: int = 5, filter_condition: dict | None = None
-        results = self.client.search(query_vector=query_vector, collection_name="documents", k=k)
+    ) -> list[dict]:
        """Search the vector store.
        Args:
            query_vector: The query embedding vector
            k: Number of results to return
            filter_condition: Optional filter condition for metadata filtering
        Returns:
            List of search results with metadata
        """
        if filter_condition:
            results = self.client.search(
                query_vector=query_vector,
                collection_name="documents",
                k=k,
                filter_condition=filter_condition,
            )
        else:
            results = self.client.search(
                query_vector=query_vector, collection_name="documents", k=k
            )
        return results
    async def add_points(self, collection_name: str, points: list[dict]) -> bool:
        """Add points to the vector store.
        Args:
            collection_name: Name of the collection
            points: List of points with id, vector, and payload
        Returns:
            True if successful
        """
        try:
            self.client.add_points(collection_name, points)
            return True
        except Exception:
            return False
    async def delete_points(self, collection_name: str, filter_condition: dict) -> bool:
        """Delete points from the vector store matching a filter.
        Args:
            collection_name: Name of the collection
            filter_condition: Filter condition for points to delete
        Returns:
            True if successful
        """
        try:
            self.client.delete_points(collection_name, filter_condition)
            return True
        except Exception:
            return False
    async def scroll_points(
        self, collection_name: str, filter_condition: dict | None = None, limit: int = 100
    ) -> list[dict]:
        """Scroll through points in the vector store.
        Args:
            collection_name: Name of the collection
            filter_condition: Optional filter condition
            limit: Maximum number of points to return
        Returns:
            List of points
        """
        try:
            results = self.client.scroll(
                collection_name=collection_name, filter_condition=filter_condition, limit=limit
            )
            return results
        except Exception:
            return []
 # Singleton
 _vector_store = None