First version of complete CRUD chunking

Sebastian
2025-11-05 19:18:11 +00:00
parent df2c184814
commit 7c6e8c4858
36 changed files with 6242 additions and 5 deletions

.gitignore

@@ -350,6 +350,8 @@ docker-compose.override.yml
 .env.*.local
 config.json
 secrets.json
+.secrets/
+**/.secrets/
 # === BACKUP FILES ===
 *.bak

app/core/config.py

@@ -26,14 +26,74 @@ class Settings(BaseSettings):
     AZURE_STORAGE_CONNECTION_STRING: str
     AZURE_STORAGE_ACCOUNT_NAME: str = ""
     AZURE_CONTAINER_NAME: str = "files"
+
+    # Qdrant vector DB configuration
+    QDRANT_URL: str
+    QDRANT_API_KEY: str
+    VECTOR_DB_TYPE: str = "qdrant"  # Future: support other backends
+
+    # Azure OpenAI configuration
+    AZURE_OPENAI_ENDPOINT: str
+    AZURE_OPENAI_API_KEY: str
+    AZURE_OPENAI_API_VERSION: str = "2024-02-01"
+    AZURE_OPENAI_EMBEDDING_MODEL: str = "text-embedding-3-large"
+    AZURE_OPENAI_EMBEDDING_DEPLOYMENT: str = "text-embedding-3-large"
+
+    # Google Cloud / Vertex AI configuration
+    GOOGLE_APPLICATION_CREDENTIALS: str
+    GOOGLE_CLOUD_PROJECT: str
+    GOOGLE_CLOUD_LOCATION: str = "us-central1"
+    GEMINI_MODEL: str = "gemini-2.0-flash"

     @validator("AZURE_STORAGE_CONNECTION_STRING")
     def validate_azure_connection_string(cls, v):
         """Validate that the Azure connection string is present"""
         if not v:
             raise ValueError("AZURE_STORAGE_CONNECTION_STRING is required")
         return v
+
+    @validator("QDRANT_URL")
+    def validate_qdrant_url(cls, v):
+        """Validate that the Qdrant URL is present"""
+        if not v:
+            raise ValueError("QDRANT_URL is required")
+        return v
+
+    @validator("QDRANT_API_KEY")
+    def validate_qdrant_api_key(cls, v):
+        """Validate that the Qdrant API key is present"""
+        if not v:
+            raise ValueError("QDRANT_API_KEY is required")
+        return v
+
+    @validator("AZURE_OPENAI_ENDPOINT")
+    def validate_azure_openai_endpoint(cls, v):
+        """Validate that the Azure OpenAI endpoint is present"""
+        if not v:
+            raise ValueError("AZURE_OPENAI_ENDPOINT is required")
+        return v
+
+    @validator("AZURE_OPENAI_API_KEY")
+    def validate_azure_openai_api_key(cls, v):
+        """Validate that the Azure OpenAI API key is present"""
+        if not v:
+            raise ValueError("AZURE_OPENAI_API_KEY is required")
+        return v
+
+    @validator("GOOGLE_APPLICATION_CREDENTIALS")
+    def validate_google_credentials(cls, v):
+        """Validate that the Google credentials path is present"""
+        if not v:
+            raise ValueError("GOOGLE_APPLICATION_CREDENTIALS is required")
+        return v
+
+    @validator("GOOGLE_CLOUD_PROJECT")
+    def validate_google_project(cls, v):
+        """Validate that the Google Cloud project is present"""
+        if not v:
+            raise ValueError("GOOGLE_CLOUD_PROJECT is required")
+        return v

     class Config:
         env_file = ".env"
         case_sensitive = True
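
For reference (not part of this commit), a minimal .env sketch covering the new required settings; every value below is an illustrative placeholder, not a real credential:

AZURE_STORAGE_CONNECTION_STRING=DefaultEndpointsProtocol=https;AccountName=example;AccountKey=changeme
QDRANT_URL=https://qdrant.example.com:6333
QDRANT_API_KEY=changeme
AZURE_OPENAI_ENDPOINT=https://example.openai.azure.com/
AZURE_OPENAI_API_KEY=changeme
GOOGLE_APPLICATION_CREDENTIALS=/path/to/service-account.json
GOOGLE_CLOUD_PROJECT=example-project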

app/main.py

@@ -6,6 +6,8 @@ import logging
 # Import routers
 from .routers.files import router as files_router
+from .routers.vectors import router as vectors_router
+from .routers.chunking import router as chunking_router
 from .core.config import settings
 # from routers.ai import router as ai_router  # future: with Azure OpenAI

@@ -98,6 +100,18 @@ app.include_router(
     tags=["files"]
 )
+
+app.include_router(
+    vectors_router,
+    prefix="/api/v1",
+    tags=["vectors"]
+)
+
+app.include_router(
+    chunking_router,
+    prefix="/api/v1",
+    tags=["chunking"]
+)

 # AI router
 # app.include_router(
 #     ai_router,

@@ -110,6 +124,7 @@ app.include_router(
 async def startup_event():
     logger.info("Starting File Manager API...")
     logger.info(f"Connecting to Azure Storage Account: {settings.AZURE_STORAGE_ACCOUNT_NAME}")
+    logger.info(f"Connecting to Qdrant: {settings.QDRANT_URL}")
     # Azure connection checks

app/models/chunking_models.py

@@ -0,0 +1,128 @@
"""
Modelos Pydantic para las operaciones de chunking.
"""
from pydantic import BaseModel, Field, validator
from typing import List, Dict, Any, Optional
# Request Models
class ChunkingPreviewRequest(BaseModel):
"""Request para generar preview de chunks"""
file_name: str = Field(..., description="Nombre del archivo PDF")
tema: str = Field(..., description="Tema/carpeta del archivo")
max_tokens: int = Field(default=950, ge=100, le=2000, description="Límite máximo de tokens por chunk")
target_tokens: int = Field(default=800, ge=100, le=2000, description="Tokens objetivo")
chunk_size: int = Field(default=1000, ge=100, le=3000, description="Tamaño del chunk")
chunk_overlap: int = Field(default=200, ge=0, le=1000, description="Solapamiento entre chunks")
use_llm: bool = Field(default=True, description="Usar LLM (Gemini) para procesamiento inteligente")
custom_instructions: str = Field(default="", description="Instrucciones personalizadas (solo si use_llm=True)")
@validator("custom_instructions")
def validate_custom_instructions(cls, v, values):
"""Valida que custom_instructions solo se use con LLM habilitado"""
if v and not values.get("use_llm", True):
raise ValueError("custom_instructions solo puede usarse cuando use_llm=True")
return v
@validator("target_tokens")
def validate_target_tokens(cls, v, values):
"""Valida que target_tokens sea menor que max_tokens"""
if "max_tokens" in values and v >= values["max_tokens"]:
raise ValueError("target_tokens debe ser menor que max_tokens")
return v
class ChunkingProcessRequest(BaseModel):
"""Request para procesar PDF completo"""
file_name: str = Field(..., description="Nombre del archivo PDF")
tema: str = Field(..., description="Tema/carpeta del archivo")
collection_name: str = Field(..., description="Nombre de la colección en Qdrant")
max_tokens: int = Field(default=950, ge=100, le=2000, description="Límite máximo de tokens por chunk")
target_tokens: int = Field(default=800, ge=100, le=2000, description="Tokens objetivo")
chunk_size: int = Field(default=1000, ge=100, le=3000, description="Tamaño del chunk")
chunk_overlap: int = Field(default=200, ge=0, le=1000, description="Solapamiento entre chunks")
use_llm: bool = Field(default=True, description="Usar LLM (Gemini) para procesamiento inteligente")
custom_instructions: str = Field(default="", description="Instrucciones personalizadas (solo si use_llm=True)")
@validator("custom_instructions")
def validate_custom_instructions(cls, v, values):
"""Valida que custom_instructions solo se use con LLM habilitado"""
if v and not values.get("use_llm", True):
raise ValueError("custom_instructions solo puede usarse cuando use_llm=True")
return v
@validator("target_tokens")
def validate_target_tokens(cls, v, values):
"""Valida que target_tokens sea menor que max_tokens"""
if "max_tokens" in values and v >= values["max_tokens"]:
raise ValueError("target_tokens debe ser menor que max_tokens")
return v
# Response Models
class ChunkPreview(BaseModel):
"""Modelo para un chunk de preview"""
index: int = Field(..., description="Índice del chunk")
text: str = Field(..., description="Contenido del chunk")
page: int = Field(..., description="Número de página")
file_name: str = Field(..., description="Nombre del archivo")
tokens: int = Field(..., description="Número aproximado de tokens")
class ChunkingPreviewResponse(BaseModel):
"""Response para preview de chunks"""
success: bool = Field(default=True, description="Indica si la operación fue exitosa")
file_name: str = Field(..., description="Nombre del archivo procesado")
tema: str = Field(..., description="Tema del archivo")
chunks: List[ChunkPreview] = Field(..., description="Lista de chunks de preview (hasta 3)")
message: str = Field(default="Preview generado exitosamente", description="Mensaje descriptivo")
@validator("chunks")
def validate_chunk_count(cls, v):
"""Valida que haya al menos 1 chunk y máximo 3 chunks en el preview"""
if len(v) < 1:
raise ValueError("El preview debe contener al menos 1 chunk")
if len(v) > 3:
raise ValueError("El preview no puede contener más de 3 chunks")
return v
class ChunkingProcessResponse(BaseModel):
"""Response para procesamiento completo"""
success: bool = Field(..., description="Indica si la operación fue exitosa")
collection_name: str = Field(..., description="Nombre de la colección")
file_name: str = Field(..., description="Nombre del archivo procesado")
total_chunks: int = Field(..., description="Total de chunks generados")
chunks_added: int = Field(..., description="Chunks agregados a Qdrant")
message: str = Field(..., description="Mensaje descriptivo")
# Profile Models
class ChunkingProfile(BaseModel):
"""Perfil de configuración predefinido para chunking"""
id: str = Field(..., description="ID del perfil")
name: str = Field(..., description="Nombre del perfil")
description: str = Field(..., description="Descripción del perfil")
max_tokens: int = Field(..., description="Límite máximo de tokens")
target_tokens: int = Field(..., description="Tokens objetivo")
chunk_size: int = Field(..., description="Tamaño del chunk")
chunk_overlap: int = Field(..., description="Solapamiento")
use_llm: bool = Field(..., description="Si usa LLM")
class ChunkingProfilesResponse(BaseModel):
"""Response con perfiles disponibles"""
profiles: List[ChunkingProfile] = Field(..., description="Lista de perfiles disponibles")
# Progress Models (para WebSockets)
class ChunkingProgress(BaseModel):
"""Modelo para reportar progreso de chunking"""
status: str = Field(..., description="Estado actual: downloading, chunking, embedding, uploading, completed, error")
progress: int = Field(..., ge=0, le=100, description="Progreso en porcentaje")
message: Optional[str] = Field(None, description="Mensaje adicional")
error: Optional[str] = Field(None, description="Mensaje de error si status=error")
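
For illustration (not part of this commit), how the cross-field validators above behave, with the models above in scope and illustrative values:

from pydantic import ValidationError

ChunkingPreviewRequest(file_name="report.pdf", tema="finance")  # OK: defaults keep target < max

try:
    ChunkingPreviewRequest(file_name="report.pdf", tema="finance",
                           max_tokens=900, target_tokens=950)
except ValidationError as e:
    print(e)  # target_tokens must be lower than max_tokens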

app/models/vector_models.py

@@ -0,0 +1,184 @@
"""
Modelos Pydantic para operaciones con bases de datos vectoriales.
Este módulo define todos los modelos de datos para requests y responses
relacionados con la gestión de colecciones y chunks en bases de datos vectoriales.
"""
from typing import List, Optional, Dict, Any
from pydantic import BaseModel, Field, validator
# ============================================================================
# Modelos para Colecciones
# ============================================================================
class CollectionExistsRequest(BaseModel):
"""Request para verificar si una colección existe."""
collection_name: str = Field(..., description="Nombre de la colección a verificar")
class CollectionExistsResponse(BaseModel):
"""Response de verificación de existencia de colección."""
exists: bool = Field(..., description="True si la colección existe")
collection_name: str = Field(..., description="Nombre de la colección")
class CollectionCreateRequest(BaseModel):
"""Request para crear una nueva colección."""
collection_name: str = Field(..., description="Nombre de la colección a crear")
vector_size: int = Field(default=3072, description="Dimensión de los vectores")
distance: str = Field(default="Cosine", description="Métrica de distancia")
@validator("distance")
def validate_distance(cls, v):
"""Valida que la métrica de distancia sea válida."""
allowed = ["Cosine", "Euclid", "Dot"]
if v not in allowed:
raise ValueError(f"Métrica de distancia debe ser una de: {allowed}")
return v
@validator("vector_size")
def validate_vector_size(cls, v):
"""Valida que el tamaño del vector sea positivo."""
if v <= 0:
raise ValueError("El tamaño del vector debe ser mayor a 0")
return v
class CollectionCreateResponse(BaseModel):
"""Response de creación de colección."""
success: bool = Field(..., description="True si se creó exitosamente")
collection_name: str = Field(..., description="Nombre de la colección creada")
message: str = Field(..., description="Mensaje descriptivo")
class CollectionDeleteResponse(BaseModel):
"""Response de eliminación de colección."""
success: bool = Field(..., description="True si se eliminó exitosamente")
collection_name: str = Field(..., description="Nombre de la colección eliminada")
message: str = Field(..., description="Mensaje descriptivo")
class CollectionInfoResponse(BaseModel):
"""Response con información de una colección."""
name: str = Field(..., description="Nombre de la colección")
vectors_count: int = Field(..., description="Número total de vectores")
vectors_config: Dict[str, Any] = Field(..., description="Configuración de vectores")
status: str = Field(..., description="Estado de la colección")
# ============================================================================
# Modelos para Archivos en Colecciones
# ============================================================================
class FileExistsInCollectionRequest(BaseModel):
"""Request para verificar si un archivo existe en una colección."""
collection_name: str = Field(..., description="Nombre de la colección")
file_name: str = Field(..., description="Nombre del archivo a verificar")
class FileExistsInCollectionResponse(BaseModel):
"""Response de verificación de existencia de archivo."""
exists: bool = Field(..., description="True si el archivo existe")
collection_name: str = Field(..., description="Nombre de la colección")
file_name: str = Field(..., description="Nombre del archivo")
chunk_count: Optional[int] = Field(None, description="Número de chunks del archivo si existe")
# ============================================================================
# Modelos para Chunks
# ============================================================================
class ChunkMetadata(BaseModel):
"""Metadata de un chunk."""
file_name: str = Field(..., description="Nombre del archivo")
page: int = Field(..., description="Número de página")
text: Optional[str] = Field(None, description="Texto del chunk")
# Se pueden agregar más campos según necesidad
class ChunkData(BaseModel):
"""Datos completos de un chunk."""
id: str = Field(..., description="ID único del chunk")
payload: ChunkMetadata = Field(..., description="Metadata del chunk")
vector: Optional[List[float]] = Field(None, description="Vector de embeddings")
class GetChunksByFileRequest(BaseModel):
"""Request para obtener chunks de un archivo."""
collection_name: str = Field(..., description="Nombre de la colección")
file_name: str = Field(..., description="Nombre del archivo")
limit: Optional[int] = Field(None, description="Límite de chunks a retornar")
@validator("limit")
def validate_limit(cls, v):
"""Valida que el límite sea positivo si está presente."""
if v is not None and v <= 0:
raise ValueError("El límite debe ser mayor a 0")
return v
class GetChunksByFileResponse(BaseModel):
"""Response con los chunks de un archivo."""
collection_name: str = Field(..., description="Nombre de la colección")
file_name: str = Field(..., description="Nombre del archivo")
chunks: List[Dict[str, Any]] = Field(..., description="Lista de chunks")
total_chunks: int = Field(..., description="Número total de chunks")
class DeleteFileFromCollectionRequest(BaseModel):
"""Request para eliminar un archivo de una colección."""
collection_name: str = Field(..., description="Nombre de la colección")
file_name: str = Field(..., description="Nombre del archivo a eliminar")
class DeleteFileFromCollectionResponse(BaseModel):
"""Response de eliminación de archivo."""
success: bool = Field(..., description="True si se eliminó exitosamente")
collection_name: str = Field(..., description="Nombre de la colección")
file_name: str = Field(..., description="Nombre del archivo eliminado")
chunks_deleted: int = Field(..., description="Número de chunks eliminados")
message: str = Field(..., description="Mensaje descriptivo")
class AddChunksRequest(BaseModel):
"""Request para agregar chunks a una colección."""
collection_name: str = Field(..., description="Nombre de la colección")
chunks: List[Dict[str, Any]] = Field(..., description="Lista de chunks a agregar")
@validator("chunks")
def validate_chunks(cls, v):
"""Valida que la lista de chunks no esté vacía."""
if not v:
raise ValueError("La lista de chunks no puede estar vacía")
return v
class AddChunksResponse(BaseModel):
"""Response de agregado de chunks."""
success: bool = Field(..., description="True si se agregaron exitosamente")
collection_name: str = Field(..., description="Nombre de la colección")
chunks_added: int = Field(..., description="Número de chunks agregados")
message: str = Field(..., description="Mensaje descriptivo")
# ============================================================================
# Modelos para Health Check
# ============================================================================
class VectorDBHealthResponse(BaseModel):
"""Response del health check de la base de datos vectorial."""
status: str = Field(..., description="Estado de la conexión")
db_type: str = Field(..., description="Tipo de base de datos vectorial")
message: str = Field(..., description="Mensaje descriptivo")
# ============================================================================
# Modelos para Errores
# ============================================================================
class VectorDBErrorResponse(BaseModel):
"""Response genérico de error."""
error: str = Field(..., description="Descripción del error")
detail: Optional[str] = Field(None, description="Detalle adicional del error")
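
For illustration (not part of this commit), the distance-metric check in action, with the models above in scope:

from pydantic import ValidationError

CollectionCreateRequest(collection_name="docs")  # OK: defaults to a 3072-dim Cosine collection

try:
    CollectionCreateRequest(collection_name="docs", distance="Manhattan")
except ValidationError as e:
    print(e)  # Distance metric must be one of: ['Cosine', 'Euclid', 'Dot']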

app/routers/chunking.py

@@ -0,0 +1,183 @@
"""
Router para operaciones de chunking de PDFs.
Endpoints para generar preview y procesar PDFs completos.
"""
import logging
from fastapi import APIRouter, HTTPException, status
from typing import List
from ..models.chunking_models import (
ChunkingPreviewRequest,
ChunkingPreviewResponse,
ChunkingProcessRequest,
ChunkingProcessResponse,
ChunkingProfilesResponse,
ChunkingProfile,
ChunkPreview
)
from ..services.chunking_service import get_chunking_service
logger = logging.getLogger(__name__)
router = APIRouter(prefix="/chunking", tags=["chunking"])
# Perfiles predefinidos
CHUNKING_PROFILES = [
ChunkingProfile(
id="balanced",
name="Balanceado",
description="Configuración equilibrada entre velocidad y calidad",
max_tokens=950,
target_tokens=800,
chunk_size=1000,
chunk_overlap=200,
use_llm=True
),
ChunkingProfile(
id="detailed",
name="Detallado",
description="Chunks más grandes para mantener más contexto",
max_tokens=1500,
target_tokens=1200,
chunk_size=1500,
chunk_overlap=300,
use_llm=True
),
ChunkingProfile(
id="compact",
name="Compacto",
description="Chunks más pequeños para búsquedas precisas",
max_tokens=600,
target_tokens=500,
chunk_size=700,
chunk_overlap=150,
use_llm=True
),
ChunkingProfile(
id="fast",
name="Rápido",
description="Sin LLM, solo procesamiento básico",
max_tokens=950,
target_tokens=800,
chunk_size=1000,
chunk_overlap=200,
use_llm=False
),
]
@router.get("/profiles", response_model=ChunkingProfilesResponse)
async def get_chunking_profiles():
"""
Obtiene los perfiles de configuración predefinidos para chunking.
Returns:
Lista de perfiles disponibles
"""
return ChunkingProfilesResponse(profiles=CHUNKING_PROFILES)
@router.post("/preview", response_model=ChunkingPreviewResponse)
async def generate_preview(request: ChunkingPreviewRequest):
"""
Genera preview de chunks para un PDF (hasta 3 chunks).
Args:
request: Configuración de chunking y ubicación del archivo
Returns:
Preview con chunks de ejemplo (máximo 3, mínimo 1)
Raises:
HTTPException: Si hay error generando el preview
"""
try:
logger.info(f"Generando preview para {request.file_name} (tema: {request.tema})")
chunking_service = get_chunking_service()
chunks = await chunking_service.process_pdf_preview(
file_name=request.file_name,
tema=request.tema,
max_tokens=request.max_tokens,
target_tokens=request.target_tokens,
chunk_size=request.chunk_size,
chunk_overlap=request.chunk_overlap,
use_llm=request.use_llm,
custom_instructions=request.custom_instructions
)
# Convertir a modelos Pydantic
chunk_previews = [
ChunkPreview(
index=chunk["index"],
text=chunk["text"],
page=chunk["page"],
file_name=chunk["file_name"],
tokens=chunk["tokens"]
)
for chunk in chunks
]
return ChunkingPreviewResponse(
success=True,
file_name=request.file_name,
tema=request.tema,
chunks=chunk_previews,
message="Preview generado exitosamente"
)
except Exception as e:
logger.error(f"Error generando preview: {e}")
raise HTTPException(
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
detail=f"Error generando preview: {str(e)}"
)
@router.post("/process", response_model=ChunkingProcessResponse)
async def process_pdf_full(request: ChunkingProcessRequest):
"""
Procesa un PDF completo y lo sube a Qdrant.
Este endpoint:
1. Descarga el PDF desde Azure Blob
2. Lo procesa en chunks con control de tokens
3. Genera embeddings con Azure OpenAI
4. Sube los chunks a Qdrant con IDs determinísticos
Args:
request: Configuración de chunking y destino
Returns:
Resultado del procesamiento con estadísticas
Raises:
HTTPException: Si hay error procesando el PDF
"""
try:
logger.info(f"Procesando PDF completo: {request.file_name} (tema: {request.tema})")
chunking_service = get_chunking_service()
result = await chunking_service.process_pdf_full(
file_name=request.file_name,
tema=request.tema,
collection_name=request.collection_name,
max_tokens=request.max_tokens,
target_tokens=request.target_tokens,
chunk_size=request.chunk_size,
chunk_overlap=request.chunk_overlap,
use_llm=request.use_llm,
custom_instructions=request.custom_instructions
)
return ChunkingProcessResponse(**result)
except Exception as e:
logger.error(f"Error procesando PDF: {e}", exc_info=True)
raise HTTPException(
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
detail=f"Error procesando PDF: {str(e)}"
)
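
For illustration (not part of this commit), calling the preview endpoint; this assumes a local server on port 8000 with the router mounted under /api/v1 as in main.py, and an illustrative file that already exists in Azure Blob:

import requests

resp = requests.post(
    "http://localhost:8000/api/v1/chunking/preview",
    json={
        "file_name": "report.pdf",  # assumed to exist under the "finance" topic
        "tema": "finance",
        "use_llm": False,           # skip Gemini for a fast structural preview
    },
)
resp.raise_for_status()
for chunk in resp.json()["chunks"]:
    print(chunk["index"], chunk["page"], chunk["tokens"])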

app/routers/vectors.py

@@ -0,0 +1,277 @@
"""
Router para endpoints de operaciones con bases de datos vectoriales.
Este módulo define todos los endpoints de la API relacionados con
la gestión de colecciones y chunks en bases de datos vectoriales.
"""
import logging
from fastapi import APIRouter, HTTPException, status, Query
from typing import Optional
from app.services.vector_service import vector_service
from app.models.vector_models import (
CollectionExistsRequest,
CollectionExistsResponse,
CollectionCreateRequest,
CollectionCreateResponse,
CollectionDeleteResponse,
CollectionInfoResponse,
FileExistsInCollectionRequest,
FileExistsInCollectionResponse,
GetChunksByFileRequest,
GetChunksByFileResponse,
DeleteFileFromCollectionRequest,
DeleteFileFromCollectionResponse,
AddChunksRequest,
AddChunksResponse,
VectorDBHealthResponse,
VectorDBErrorResponse
)
logger = logging.getLogger(__name__)
router = APIRouter(
prefix="/vectors",
tags=["Vectors"],
responses={
500: {"model": VectorDBErrorResponse, "description": "Error interno del servidor"}
}
)
# ============================================================================
# Endpoints de Health Check
# ============================================================================
@router.get(
"/health",
response_model=VectorDBHealthResponse,
summary="Verificar estado de la base de datos vectorial",
description="Verifica que la conexión con la base de datos vectorial esté funcionando correctamente"
)
async def health_check():
"""Health check de la base de datos vectorial."""
try:
return await vector_service.health_check()
except Exception as e:
logger.error(f"Error en health check: {e}")
raise HTTPException(
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
detail=f"Error al verificar estado de la base de datos: {str(e)}"
)
# ============================================================================
# Endpoints de Colecciones
# ============================================================================
@router.post(
"/collections/exists",
response_model=CollectionExistsResponse,
summary="Verificar si una colección existe",
description="Verifica si existe una colección con el nombre especificado"
)
async def check_collection_exists(request: CollectionExistsRequest):
"""Verifica si una colección existe."""
try:
return await vector_service.check_collection_exists(request.collection_name)
except Exception as e:
logger.error(f"Error al verificar colección: {e}")
raise HTTPException(
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
detail=f"Error al verificar colección: {str(e)}"
)
@router.post(
"/collections/create",
response_model=CollectionCreateResponse,
status_code=status.HTTP_201_CREATED,
summary="Crear una nueva colección",
description="Crea una nueva colección en la base de datos vectorial"
)
async def create_collection(request: CollectionCreateRequest):
"""Crea una nueva colección."""
try:
return await vector_service.create_collection(request)
except ValueError as e:
logger.warning(f"Error de validación al crear colección: {e}")
raise HTTPException(
status_code=status.HTTP_400_BAD_REQUEST,
detail=str(e)
)
except Exception as e:
logger.error(f"Error al crear colección: {e}")
raise HTTPException(
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
detail=f"Error al crear colección: {str(e)}"
)
@router.delete(
"/collections/{collection_name}",
response_model=CollectionDeleteResponse,
summary="Eliminar una colección",
description="Elimina completamente una colección y todos sus datos"
)
async def delete_collection(collection_name: str):
"""Elimina una colección completa."""
try:
return await vector_service.delete_collection(collection_name)
except ValueError as e:
logger.warning(f"Error de validación al eliminar colección: {e}")
raise HTTPException(
status_code=status.HTTP_404_NOT_FOUND,
detail=str(e)
)
except Exception as e:
logger.error(f"Error al eliminar colección: {e}")
raise HTTPException(
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
detail=f"Error al eliminar colección: {str(e)}"
)
@router.get(
"/collections/{collection_name}/info",
response_model=CollectionInfoResponse,
summary="Obtener información de una colección",
description="Obtiene información detallada sobre una colección"
)
async def get_collection_info(collection_name: str):
"""Obtiene información de una colección."""
try:
info = await vector_service.get_collection_info(collection_name)
if info is None:
raise HTTPException(
status_code=status.HTTP_404_NOT_FOUND,
detail=f"Colección '{collection_name}' no encontrada"
)
return info
except HTTPException:
raise
except Exception as e:
logger.error(f"Error al obtener info de colección: {e}")
raise HTTPException(
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
detail=f"Error al obtener información de colección: {str(e)}"
)
# ============================================================================
# Endpoints de Archivos en Colecciones
# ============================================================================
@router.post(
"/files/exists",
response_model=FileExistsInCollectionResponse,
summary="Verificar si un archivo existe en una colección",
description="Verifica si un archivo específico existe en una colección"
)
async def check_file_exists_in_collection(request: FileExistsInCollectionRequest):
"""Verifica si un archivo existe en una colección."""
try:
return await vector_service.check_file_exists_in_collection(
request.collection_name,
request.file_name
)
except Exception as e:
logger.error(f"Error al verificar archivo en colección: {e}")
raise HTTPException(
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
detail=f"Error al verificar archivo: {str(e)}"
)
@router.get(
"/collections/{collection_name}/files/{file_name}/chunks",
response_model=GetChunksByFileResponse,
summary="Obtener chunks de un archivo",
description="Obtiene todos los chunks de un archivo específico en una colección"
)
async def get_chunks_by_file(
collection_name: str,
file_name: str,
limit: Optional[int] = Query(None, description="Límite de chunks a retornar")
):
"""Obtiene todos los chunks de un archivo."""
try:
return await vector_service.get_chunks_by_file(
collection_name,
file_name,
limit
)
except ValueError as e:
logger.warning(f"Error de validación al obtener chunks: {e}")
raise HTTPException(
status_code=status.HTTP_404_NOT_FOUND,
detail=str(e)
)
except Exception as e:
logger.error(f"Error al obtener chunks: {e}")
raise HTTPException(
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
detail=f"Error al obtener chunks: {str(e)}"
)
@router.delete(
"/collections/{collection_name}/files/{file_name}",
response_model=DeleteFileFromCollectionResponse,
summary="Eliminar un archivo de una colección",
description="Elimina todos los chunks de un archivo de una colección"
)
async def delete_file_from_collection(collection_name: str, file_name: str):
"""Elimina todos los chunks de un archivo."""
try:
return await vector_service.delete_file_from_collection(
collection_name,
file_name
)
except ValueError as e:
logger.warning(f"Error de validación al eliminar archivo: {e}")
raise HTTPException(
status_code=status.HTTP_404_NOT_FOUND,
detail=str(e)
)
except Exception as e:
logger.error(f"Error al eliminar archivo: {e}")
raise HTTPException(
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
detail=f"Error al eliminar archivo: {str(e)}"
)
# ============================================================================
# Endpoints de Chunks
# ============================================================================
@router.post(
"/chunks/add",
response_model=AddChunksResponse,
status_code=status.HTTP_201_CREATED,
summary="Agregar chunks a una colección",
description="Agrega múltiples chunks a una colección existente"
)
async def add_chunks(request: AddChunksRequest):
"""Agrega chunks a una colección."""
try:
return await vector_service.add_chunks(
request.collection_name,
request.chunks
)
except ValueError as e:
logger.warning(f"Error de validación al agregar chunks: {e}")
raise HTTPException(
status_code=status.HTTP_400_BAD_REQUEST,
detail=str(e)
)
except Exception as e:
logger.error(f"Error al agregar chunks: {e}")
raise HTTPException(
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
detail=f"Error al agregar chunks: {str(e)}"
)
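
For illustration (not part of this commit), exercising the health check and collection creation against the same assumed local deployment:

import requests

BASE = "http://localhost:8000/api/v1/vectors"

print(requests.get(f"{BASE}/health").json())

resp = requests.post(
    f"{BASE}/collections/create",
    json={"collection_name": "docs", "vector_size": 3072, "distance": "Cosine"},
)
print(resp.status_code)  # 201 on success; 400 if the collection already exists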

app/services/chunking_service.py

@@ -0,0 +1,316 @@
"""
Servicio de chunking que orquesta todo el proceso:
- Descarga PDF desde Azure Blob
- Procesa con pipeline de chunking
- Genera embeddings con Azure OpenAI
- Sube a Qdrant con IDs determinísticos
"""
import logging
import uuid
from typing import List, Dict, Any, Optional
from io import BytesIO
from azure.storage.blob import BlobServiceClient
from langchain_core.documents import Document
from ..core.config import settings
from ..utils.chunking import (
process_pdf_with_token_control,
get_gemini_client,
GeminiClient
)
from ..services.embedding_service import get_embedding_service
from ..vector_db.factory import get_vector_db
logger = logging.getLogger(__name__)
class ChunkingService:
"""Servicio para procesar PDFs y subirlos a Qdrant"""
def __init__(self):
"""Inicializa el servicio con conexiones a Azure Blob y clientes"""
self.blob_service = BlobServiceClient.from_connection_string(
settings.AZURE_STORAGE_CONNECTION_STRING
)
self.container_name = settings.AZURE_CONTAINER_NAME
self.embedding_service = get_embedding_service()
self.vector_db = get_vector_db()
def _generate_deterministic_id(
self,
file_name: str,
page: int,
chunk_index: int
) -> str:
"""
Genera un ID determinístico para un chunk usando UUID v5.
Args:
file_name: Nombre del archivo
page: Número de página
chunk_index: Índice del chunk dentro de la página
Returns:
ID en formato UUID válido para Qdrant
"""
id_string = f"{file_name}_{page}_{chunk_index}"
# Usar UUID v5 con namespace DNS para generar UUID determinístico
return str(uuid.uuid5(uuid.NAMESPACE_DNS, id_string))
async def download_pdf_from_blob(
self,
file_name: str,
tema: str
) -> bytes:
"""
Descarga un PDF desde Azure Blob Storage.
Args:
file_name: Nombre del archivo
tema: Tema/carpeta del archivo
Returns:
Contenido del PDF en bytes
Raises:
Exception: Si hay error descargando el archivo
"""
try:
blob_path = f"{tema}/{file_name}"
logger.info(f"Descargando PDF: {blob_path}")
blob_client = self.blob_service.get_blob_client(
container=self.container_name,
blob=blob_path
)
pdf_bytes = blob_client.download_blob().readall()
logger.info(f"PDF descargado: {len(pdf_bytes)} bytes")
return pdf_bytes
except Exception as e:
logger.error(f"Error descargando PDF: {e}")
raise
async def process_pdf_preview(
self,
file_name: str,
tema: str,
max_tokens: int = 950,
target_tokens: int = 800,
chunk_size: int = 1000,
chunk_overlap: int = 200,
use_llm: bool = True,
custom_instructions: str = ""
) -> List[Dict[str, Any]]:
"""
Procesa un PDF y genera exactamente 3 chunks de preview.
Args:
file_name: Nombre del archivo PDF
tema: Tema/carpeta del archivo
max_tokens: Límite máximo de tokens por chunk
target_tokens: Tokens objetivo
chunk_size: Tamaño del chunk
chunk_overlap: Solapamiento
use_llm: Si True, usa Gemini para procesamiento inteligente
custom_instructions: Instrucciones personalizadas (solo si use_llm=True)
Returns:
Lista con exactamente 3 chunks de preview con metadata
"""
try:
logger.info(f"Generando preview para {file_name} (tema: {tema})")
# Descargar PDF
pdf_bytes = await self.download_pdf_from_blob(file_name, tema)
# Configurar cliente Gemini si está habilitado
gemini_client = get_gemini_client() if use_llm else None
# Si LLM está deshabilitado, ignorar custom_instructions
instructions = custom_instructions if use_llm else ""
# Procesar PDF
chunks = process_pdf_with_token_control(
pdf_bytes=pdf_bytes,
file_name=file_name,
max_tokens=max_tokens,
target_tokens=target_tokens,
chunk_size=chunk_size,
chunk_overlap=chunk_overlap,
merge_related=True,
gemini_client=gemini_client,
custom_instructions=instructions,
extract_images=False # Deshabilitado según requerimientos
)
# Tomar los primeros chunks para preview (máximo 3, mínimo 1)
preview_chunks = chunks[:min(3, len(chunks))] if chunks else []
# Formatear para respuesta
result = []
for idx, chunk in enumerate(preview_chunks):
result.append({
"index": idx,
"text": chunk.page_content,
"page": chunk.metadata.get("page", 0),
"file_name": chunk.metadata.get("file_name", file_name),
"tokens": len(chunk.page_content.split()) # Aproximación
})
logger.info(f"Preview generado: {len(result)} chunks")
return result
except Exception as e:
logger.error(f"Error generando preview: {e}")
raise
async def process_pdf_full(
self,
file_name: str,
tema: str,
collection_name: str,
max_tokens: int = 950,
target_tokens: int = 800,
chunk_size: int = 1000,
chunk_overlap: int = 200,
use_llm: bool = True,
custom_instructions: str = "",
progress_callback: Optional[callable] = None
) -> Dict[str, Any]:
"""
Procesa un PDF completo y lo sube a Qdrant.
Args:
file_name: Nombre del archivo PDF
tema: Tema/carpeta del archivo
collection_name: Nombre de la colección en Qdrant
max_tokens: Límite máximo de tokens por chunk
target_tokens: Tokens objetivo
chunk_size: Tamaño del chunk
chunk_overlap: Solapamiento
use_llm: Si True, usa Gemini para procesamiento inteligente
custom_instructions: Instrucciones personalizadas (solo si use_llm=True)
progress_callback: Callback para reportar progreso
Returns:
Diccionario con resultados del procesamiento
"""
try:
logger.info(f"Procesando PDF completo: {file_name} (tema: {tema})")
if progress_callback:
await progress_callback({"status": "downloading", "progress": 0})
# 1. Descargar PDF
pdf_bytes = await self.download_pdf_from_blob(file_name, tema)
if progress_callback:
await progress_callback({"status": "chunking", "progress": 20})
# 2. Configurar cliente Gemini
gemini_client = get_gemini_client() if use_llm else None
instructions = custom_instructions if use_llm else ""
# 3. Procesar PDF
chunks = process_pdf_with_token_control(
pdf_bytes=pdf_bytes,
file_name=file_name,
max_tokens=max_tokens,
target_tokens=target_tokens,
chunk_size=chunk_size,
chunk_overlap=chunk_overlap,
merge_related=True,
gemini_client=gemini_client,
custom_instructions=instructions,
extract_images=False
)
if progress_callback:
await progress_callback({"status": "embedding", "progress": 50})
# 4. Generar embeddings
texts = [chunk.page_content for chunk in chunks]
logger.info(f"Generando embeddings para {len(texts)} chunks")
embeddings = await self.embedding_service.generate_embeddings_batch(texts)
logger.info(f"Embeddings generados: {len(embeddings)} vectores de dimensión {len(embeddings[0]) if embeddings else 0}")
if progress_callback:
await progress_callback({"status": "uploading", "progress": 80})
# 5. Preparar chunks para Qdrant con IDs determinísticos
qdrant_chunks = []
page_chunk_count = {} # Contador de chunks por página
logger.info(f"Preparando {len(chunks)} chunks con {len(embeddings)} embeddings para subir")
for chunk, embedding in zip(chunks, embeddings):
page = chunk.metadata.get("page", 0)
# Incrementar contador para esta página
if page not in page_chunk_count:
page_chunk_count[page] = 0
chunk_index = page_chunk_count[page]
page_chunk_count[page] += 1
# Generar ID determinístico
chunk_id = self._generate_deterministic_id(
file_name=file_name,
page=page,
chunk_index=chunk_index
)
qdrant_chunks.append({
"id": chunk_id,
"vector": embedding,
"payload": {
"page_content": chunk.page_content,
"metadata": {
"page": page,
"file_name": file_name
}
}
})
# 6. Subir a Qdrant
logger.info(f"Subiendo {len(qdrant_chunks)} chunks a Qdrant colección '{collection_name}'")
result = await self.vector_db.add_chunks(collection_name, qdrant_chunks)
logger.info(f"Resultado de upsert: {result}")
if progress_callback:
await progress_callback({"status": "completed", "progress": 100})
logger.info(f"Procesamiento completo: {result['chunks_added']} chunks subidos")
return {
"success": True,
"collection_name": collection_name,
"file_name": file_name,
"total_chunks": len(chunks),
"chunks_added": result['chunks_added'],
"message": "PDF procesado y subido exitosamente"
}
except Exception as e:
logger.error(f"Error procesando PDF completo: {e}")
if progress_callback:
await progress_callback({"status": "error", "progress": 0, "error": str(e)})
raise
# Instancia global singleton
_chunking_service: ChunkingService | None = None
def get_chunking_service() -> ChunkingService:
"""
Obtiene la instancia singleton del servicio de chunking.
Returns:
Instancia de ChunkingService
"""
global _chunking_service
if _chunking_service is None:
_chunking_service = ChunkingService()
return _chunking_service
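
The deterministic IDs are what make re-processing idempotent: the same (file_name, page, chunk_index) triple always maps to the same Qdrant point ID, so re-running a file upserts over the old points instead of duplicating them. A standalone sketch (not part of this commit; the file name is illustrative):

import uuid

a = uuid.uuid5(uuid.NAMESPACE_DNS, "report.pdf_3_0")
b = uuid.uuid5(uuid.NAMESPACE_DNS, "report.pdf_3_0")
assert a == b  # stable across runs and machines
print(a)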

app/services/embedding_service.py

@@ -0,0 +1,127 @@
"""
Servicio de embeddings usando Azure OpenAI.
Genera embeddings para chunks de texto usando text-embedding-3-large (3072 dimensiones).
"""
import logging
from typing import List
from openai import AzureOpenAI
from ..core.config import settings
logger = logging.getLogger(__name__)
class EmbeddingService:
"""Servicio para generar embeddings usando Azure OpenAI"""
def __init__(self):
"""Inicializa el cliente de Azure OpenAI"""
try:
self.client = AzureOpenAI(
api_key=settings.AZURE_OPENAI_API_KEY,
api_version=settings.AZURE_OPENAI_API_VERSION,
azure_endpoint=settings.AZURE_OPENAI_ENDPOINT
)
self.model = settings.AZURE_OPENAI_EMBEDDING_DEPLOYMENT
self.embedding_dimension = 3072
logger.info(f"EmbeddingService inicializado con modelo {self.model}")
except Exception as e:
logger.error(f"Error inicializando EmbeddingService: {e}")
raise
async def generate_embedding(self, text: str) -> List[float]:
"""
Genera un embedding para un texto individual.
Args:
text: Texto para generar embedding
Returns:
Vector de embedding (3072 dimensiones)
Raises:
Exception: Si hay error al generar el embedding
"""
try:
response = self.client.embeddings.create(
input=[text],
model=self.model
)
embedding = response.data[0].embedding
if len(embedding) != self.embedding_dimension:
raise ValueError(
f"Dimensión incorrecta: esperada {self.embedding_dimension}, "
f"obtenida {len(embedding)}"
)
return embedding
except Exception as e:
logger.error(f"Error generando embedding: {e}")
raise
async def generate_embeddings_batch(
self,
texts: List[str],
batch_size: int = 100
) -> List[List[float]]:
"""
Genera embeddings para múltiples textos en lotes.
Args:
texts: Lista de textos para generar embeddings
batch_size: Tamaño del lote para procesamiento (default: 100)
Returns:
Lista de vectores de embeddings
Raises:
Exception: Si hay error al generar los embeddings
"""
try:
embeddings = []
for i in range(0, len(texts), batch_size):
batch = texts[i:i + batch_size]
logger.info(f"Procesando lote {i//batch_size + 1}/{(len(texts)-1)//batch_size + 1}")
response = self.client.embeddings.create(
input=batch,
model=self.model
)
batch_embeddings = [item.embedding for item in response.data]
# Validar dimensiones
for idx, emb in enumerate(batch_embeddings):
if len(emb) != self.embedding_dimension:
raise ValueError(
f"Dimensión incorrecta en índice {i + idx}: "
f"esperada {self.embedding_dimension}, obtenida {len(emb)}"
)
embeddings.extend(batch_embeddings)
logger.info(f"Generados {len(embeddings)} embeddings exitosamente")
return embeddings
except Exception as e:
logger.error(f"Error generando embeddings en lote: {e}")
raise
# Instancia global singleton
_embedding_service: EmbeddingService | None = None
def get_embedding_service() -> EmbeddingService:
"""
Obtiene la instancia singleton del servicio de embeddings.
Returns:
Instancia de EmbeddingService
"""
global _embedding_service
if _embedding_service is None:
_embedding_service = EmbeddingService()
return _embedding_service
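
For illustration (not part of this commit), a usage sketch; it assumes valid Azure OpenAI settings in the environment and that the module is importable as app.services.embedding_service:

import asyncio
from app.services.embedding_service import get_embedding_service

async def main():
    service = get_embedding_service()
    vectors = await service.generate_embeddings_batch(["first chunk", "second chunk"])
    print(len(vectors), len(vectors[0]))  # 2 3072

asyncio.run(main())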

app/services/vector_service.py

@@ -0,0 +1,442 @@
"""
Servicio de lógica de negocio para operaciones con bases de datos vectoriales.
Este módulo contiene toda la lógica de negocio relacionada con la gestión
de colecciones y chunks en bases de datos vectoriales.
"""
import logging
from typing import List, Dict, Any, Optional
from app.vector_db import get_vector_db
from app.models.vector_models import (
CollectionCreateRequest,
CollectionCreateResponse,
CollectionDeleteResponse,
CollectionExistsResponse,
CollectionInfoResponse,
FileExistsInCollectionResponse,
GetChunksByFileResponse,
DeleteFileFromCollectionResponse,
AddChunksResponse,
VectorDBHealthResponse,
VectorDBErrorResponse
)
logger = logging.getLogger(__name__)
class VectorService:
"""
Servicio para gestionar operaciones con bases de datos vectoriales.
Este servicio actúa como una capa intermedia entre los routers y
la implementación de la base de datos vectorial.
"""
def __init__(self):
"""Inicializa el servicio con la instancia de la base de datos vectorial."""
self.vector_db = get_vector_db()
async def check_collection_exists(self, collection_name: str) -> CollectionExistsResponse:
"""
Verifica si una colección existe.
Args:
collection_name: Nombre de la colección
Returns:
CollectionExistsResponse: Response con el resultado
"""
try:
exists = await self.vector_db.collection_exists(collection_name)
logger.info(f"Verificación de colección '{collection_name}': {exists}")
return CollectionExistsResponse(
exists=exists,
collection_name=collection_name
)
except Exception as e:
logger.error(f"Error al verificar colección '{collection_name}': {e}")
raise
async def create_collection(
self,
request: CollectionCreateRequest
) -> CollectionCreateResponse:
"""
Crea una nueva colección.
Args:
request: Request con los datos de la colección
Returns:
CollectionCreateResponse: Response con el resultado
Raises:
ValueError: Si la colección ya existe
"""
try:
# Verificar si ya existe
exists = await self.vector_db.collection_exists(request.collection_name)
if exists:
logger.warning(f"Intento de crear colección existente: '{request.collection_name}'")
raise ValueError(f"La colección '{request.collection_name}' ya existe")
# Crear la colección
success = await self.vector_db.create_collection(
collection_name=request.collection_name,
vector_size=request.vector_size,
distance=request.distance
)
if success:
logger.info(f"Colección '{request.collection_name}' creada exitosamente")
return CollectionCreateResponse(
success=True,
collection_name=request.collection_name,
message=f"Colección '{request.collection_name}' creada exitosamente"
)
else:
logger.error(f"Fallo al crear colección '{request.collection_name}'")
raise Exception(f"No se pudo crear la colección '{request.collection_name}'")
except ValueError:
raise
except Exception as e:
logger.error(f"Error al crear colección '{request.collection_name}': {e}")
raise
async def delete_collection(self, collection_name: str) -> CollectionDeleteResponse:
"""
Elimina una colección completa.
Args:
collection_name: Nombre de la colección
Returns:
CollectionDeleteResponse: Response con el resultado
Raises:
ValueError: Si la colección no existe
"""
try:
# Verificar que existe
exists = await self.vector_db.collection_exists(collection_name)
if not exists:
logger.warning(f"Intento de eliminar colección inexistente: '{collection_name}'")
raise ValueError(f"La colección '{collection_name}' no existe")
# Eliminar la colección
success = await self.vector_db.delete_collection(collection_name)
if success:
logger.info(f"Colección '{collection_name}' eliminada exitosamente")
return CollectionDeleteResponse(
success=True,
collection_name=collection_name,
message=f"Colección '{collection_name}' eliminada exitosamente"
)
else:
logger.error(f"Fallo al eliminar colección '{collection_name}'")
raise Exception(f"No se pudo eliminar la colección '{collection_name}'")
except ValueError:
raise
except Exception as e:
logger.error(f"Error al eliminar colección '{collection_name}': {e}")
raise
async def get_collection_info(self, collection_name: str) -> Optional[CollectionInfoResponse]:
"""
Obtiene información de una colección.
Args:
collection_name: Nombre de la colección
Returns:
Optional[CollectionInfoResponse]: Información de la colección o None
"""
try:
info = await self.vector_db.get_collection_info(collection_name)
if info is None:
logger.warning(f"Colección '{collection_name}' no encontrada")
return None
return CollectionInfoResponse(**info)
except Exception as e:
logger.error(f"Error al obtener info de colección '{collection_name}': {e}")
raise
async def check_file_exists_in_collection(
self,
collection_name: str,
file_name: str
) -> FileExistsInCollectionResponse:
"""
Verifica si un archivo existe en una colección.
Args:
collection_name: Nombre de la colección
file_name: Nombre del archivo
Returns:
FileExistsInCollectionResponse: Response con el resultado
"""
try:
# Primero verificar que la colección existe
collection_exists = await self.vector_db.collection_exists(collection_name)
if not collection_exists:
logger.warning(f"Colección '{collection_name}' no existe")
return FileExistsInCollectionResponse(
exists=False,
collection_name=collection_name,
file_name=file_name,
chunk_count=0
)
# Verificar si el archivo existe
file_exists = await self.vector_db.file_exists_in_collection(
collection_name,
file_name
)
chunk_count = None
if file_exists:
chunk_count = await self.vector_db.count_chunks_in_file(
collection_name,
file_name
)
logger.info(
f"Archivo '{file_name}' en colección '{collection_name}': "
f"existe={file_exists}, chunks={chunk_count}"
)
return FileExistsInCollectionResponse(
exists=file_exists,
collection_name=collection_name,
file_name=file_name,
chunk_count=chunk_count
)
except Exception as e:
logger.error(
f"Error al verificar archivo '{file_name}' "
f"en colección '{collection_name}': {e}"
)
raise
async def get_chunks_by_file(
self,
collection_name: str,
file_name: str,
limit: Optional[int] = None
) -> GetChunksByFileResponse:
"""
Obtiene todos los chunks de un archivo.
Args:
collection_name: Nombre de la colección
file_name: Nombre del archivo
limit: Límite opcional de chunks
Returns:
GetChunksByFileResponse: Response con los chunks
Raises:
ValueError: Si la colección no existe
"""
try:
# Verificar que la colección existe
exists = await self.vector_db.collection_exists(collection_name)
if not exists:
logger.warning(f"Colección '{collection_name}' no existe")
raise ValueError(f"La colección '{collection_name}' no existe")
# Obtener chunks
chunks = await self.vector_db.get_chunks_by_file(
collection_name,
file_name,
limit
)
logger.info(
f"Obtenidos {len(chunks)} chunks del archivo '{file_name}' "
f"de la colección '{collection_name}'"
)
return GetChunksByFileResponse(
collection_name=collection_name,
file_name=file_name,
chunks=chunks,
total_chunks=len(chunks)
)
except ValueError:
raise
except Exception as e:
logger.error(
f"Error al obtener chunks del archivo '{file_name}' "
f"de la colección '{collection_name}': {e}"
)
raise
async def delete_file_from_collection(
self,
collection_name: str,
file_name: str
) -> DeleteFileFromCollectionResponse:
"""
Elimina todos los chunks de un archivo de una colección.
Args:
collection_name: Nombre de la colección
file_name: Nombre del archivo
Returns:
DeleteFileFromCollectionResponse: Response con el resultado
Raises:
ValueError: Si la colección no existe o el archivo no está en la colección
"""
try:
# Verificar que la colección existe
collection_exists = await self.vector_db.collection_exists(collection_name)
if not collection_exists:
logger.warning(f"Colección '{collection_name}' no existe")
raise ValueError(f"La colección '{collection_name}' no existe")
# Verificar que el archivo existe en la colección
file_exists = await self.vector_db.file_exists_in_collection(
collection_name,
file_name
)
if not file_exists:
logger.warning(
f"Archivo '{file_name}' no existe en colección '{collection_name}'"
)
raise ValueError(
f"El archivo '{file_name}' no existe en la colección '{collection_name}'"
)
# Eliminar el archivo
chunks_deleted = await self.vector_db.delete_file_from_collection(
collection_name,
file_name
)
logger.info(
f"Eliminados {chunks_deleted} chunks del archivo '{file_name}' "
f"de la colección '{collection_name}'"
)
return DeleteFileFromCollectionResponse(
success=True,
collection_name=collection_name,
file_name=file_name,
chunks_deleted=chunks_deleted,
message=f"Archivo '{file_name}' eliminado exitosamente ({chunks_deleted} chunks)"
)
except ValueError:
raise
except Exception as e:
logger.error(
f"Error al eliminar archivo '{file_name}' "
f"de la colección '{collection_name}': {e}"
)
raise
async def add_chunks(
self,
collection_name: str,
chunks: List[Dict[str, Any]]
) -> AddChunksResponse:
"""
Agrega chunks a una colección.
Args:
collection_name: Nombre de la colección
chunks: Lista de chunks a agregar
Returns:
AddChunksResponse: Response con el resultado
Raises:
ValueError: Si la colección no existe
"""
try:
# Verificar que la colección existe
exists = await self.vector_db.collection_exists(collection_name)
if not exists:
logger.warning(f"Colección '{collection_name}' no existe")
raise ValueError(f"La colección '{collection_name}' no existe")
# Agregar chunks
success = await self.vector_db.add_chunks(collection_name, chunks)
if success:
logger.info(
f"Agregados {len(chunks)} chunks a la colección '{collection_name}'"
)
return AddChunksResponse(
success=True,
collection_name=collection_name,
chunks_added=len(chunks),
message=f"Se agregaron {len(chunks)} chunks exitosamente"
)
else:
logger.error(f"Fallo al agregar chunks a '{collection_name}'")
raise Exception(f"No se pudieron agregar los chunks a '{collection_name}'")
except ValueError:
raise
except Exception as e:
logger.error(f"Error al agregar chunks a '{collection_name}': {e}")
raise
async def health_check(self) -> VectorDBHealthResponse:
"""
Verifica el estado de la conexión con la base de datos vectorial.
Returns:
VectorDBHealthResponse: Response con el estado
"""
try:
is_healthy = await self.vector_db.health_check()
if is_healthy:
return VectorDBHealthResponse(
status="healthy",
db_type="qdrant",
message="Conexión exitosa con la base de datos vectorial"
)
else:
return VectorDBHealthResponse(
status="unhealthy",
db_type="qdrant",
message="No se pudo conectar con la base de datos vectorial"
)
except Exception as e:
logger.error(f"Error en health check: {e}")
return VectorDBHealthResponse(
status="error",
db_type="qdrant",
message=f"Error al verificar conexión: {str(e)}"
)
# Instancia global del servicio
vector_service = VectorService()

app/utils/chunking/__init__.py

@@ -0,0 +1,18 @@
"""
Utilidades de chunking para procesamiento de PDFs.
Refactorización modular del pipeline de chunking_token.py
"""
from .gemini_client import GeminiClient, get_gemini_client
from .token_manager import TokenManager
from .chunk_processor import OptimizedChunkProcessor
from .pdf_extractor import OptimizedPDFExtractor
from .pipeline import process_pdf_with_token_control
__all__ = [
"GeminiClient",
"get_gemini_client",
"TokenManager",
"OptimizedChunkProcessor",
"OptimizedPDFExtractor",
"process_pdf_with_token_control",
]

app/utils/chunking/chunk_processor.py

@@ -0,0 +1,258 @@
"""
Procesador optimizado de chunks con soporte para LLM (Gemini).
Permite merge inteligente y mejora de chunks usando IA.
"""
import logging
import time
import hashlib
from typing import List, Optional
from langchain_core.documents import Document
from .token_manager import TokenManager
from .gemini_client import GeminiClient
logger = logging.getLogger(__name__)
class OptimizedChunkProcessor:
"""Procesador de chunks con optimización mediante LLM"""
def __init__(
self,
max_tokens: int = 1000,
target_tokens: int = 800,
chunks_per_batch: int = 5,
gemini_client: Optional[GeminiClient] = None,
model_name: str = "gpt-3.5-turbo",
custom_instructions: str = ""
):
"""
Inicializa el procesador de chunks.
Args:
max_tokens: Límite máximo de tokens por chunk
target_tokens: Tokens objetivo para chunks optimizados
chunks_per_batch: Chunks a procesar por lote
gemini_client: Cliente de Gemini para procesamiento (opcional)
model_name: Modelo para cálculo de tokens
custom_instructions: Instrucciones adicionales para el prompt de optimización
"""
self.client = gemini_client
self.chunks_per_batch = chunks_per_batch
self.max_tokens = max_tokens
self.target_tokens = target_tokens
self.token_manager = TokenManager(model_name)
self.custom_instructions = custom_instructions
# Caché para evitar reprocesamiento
self._merge_cache = {}
self._enhance_cache = {}
def _get_cache_key(self, text: str) -> str:
"""Genera una clave de caché para el texto"""
combined = text + self.custom_instructions
return hashlib.md5(combined.encode()).hexdigest()[:16]
def should_merge_chunks(self, chunk1: str, chunk2: str) -> bool:
"""
Determina si dos chunks deben unirse basándose en continuidad semántica.
Args:
chunk1: Primer chunk
chunk2: Segundo chunk
Returns:
True si los chunks deben unirse
"""
cache_key = f"{self._get_cache_key(chunk1)}_{self._get_cache_key(chunk2)}"
if cache_key in self._merge_cache:
return self._merge_cache[cache_key]
try:
combined_text = f"{chunk1}\n\n{chunk2}"
combined_tokens = self.token_manager.count_tokens(combined_text)
if combined_tokens > self.max_tokens:
self._merge_cache[cache_key] = False
return False
if self.client:
base_prompt = f"""Analiza estos dos fragmentos de texto y determina si deben unirse.
LÍMITES ESTRICTOS:
- Tokens combinados: {combined_tokens}/{self.max_tokens}
- Solo unir si hay continuidad semántica clara
Criterios de unión:
1. El primer fragmento termina abruptamente
2. El segundo fragmento continúa la misma idea/concepto
3. La unión mejora la coherencia del contenido
4. Exceder {self.max_tokens} tokens, SOLAMENTE si es necesario para mantener el contexto
Responde SOLO 'SI' o 'NO'.
Fragmento 1 ({self.token_manager.count_tokens(chunk1)} tokens):
{chunk1[:500]}...
Fragmento 2 ({self.token_manager.count_tokens(chunk2)} tokens):
{chunk2[:500]}..."""
response = self.client.generate_content(base_prompt)
result = response.strip().upper() == 'SI'
self._merge_cache[cache_key] = result
return result
# Heurística simple si no hay cliente LLM
result = (
chunk1.rstrip().endswith(('.', '!', '?')) == False and
combined_tokens <= self.target_tokens
)
self._merge_cache[cache_key] = result
return result
except Exception as e:
logger.error(f"Error analizando chunks para merge: {e}")
self._merge_cache[cache_key] = False
return False
def enhance_chunk(self, chunk_text: str) -> str:
"""
Mejora un chunk usando LLM o truncamiento.
Args:
chunk_text: Texto del chunk a mejorar
Returns:
Texto del chunk mejorado
"""
cache_key = self._get_cache_key(chunk_text)
if cache_key in self._enhance_cache:
return self._enhance_cache[cache_key]
current_tokens = self.token_manager.count_tokens(chunk_text)
try:
if self.client and current_tokens < self.max_tokens:
base_prompt = f"""Optimiza este texto siguiendo estas reglas ESTRICTAS:
LÍMITES DE TOKENS:
- Actual: {current_tokens} tokens
- Máximo permitido: {self.max_tokens} tokens
- Objetivo: {self.target_tokens} tokens
REGLAS FUNDAMENTALES:
NO exceder {self.max_tokens} tokens bajo ninguna circunstancia
Mantener TODA la información esencial y metadatos
NO cambiar términos técnicos o palabras clave
Asegurar oraciones completas y coherentes
Optimizar claridad y estructura sin añadir contenido
SOLO devuelve el texto no agregues conclusiones NUNCA
Si el texto está cerca del límite, NO expandir. Solo mejorar estructura."""
if self.custom_instructions.strip():
base_prompt += f"\n\nINSTRUCCIONES ADICIONALES:\n{self.custom_instructions}"
base_prompt += f"\n\nTexto a optimizar:\n{chunk_text}"
response = self.client.generate_content(base_prompt)
enhanced_text = response.strip()
enhanced_tokens = self.token_manager.count_tokens(enhanced_text)
if enhanced_tokens > self.max_tokens:
logger.warning(
f"Texto optimizado excede límite ({enhanced_tokens} > {self.max_tokens}), truncando"
)
enhanced_text = self.token_manager.truncate_to_tokens(enhanced_text, self.max_tokens)
self._enhance_cache[cache_key] = enhanced_text
return enhanced_text
else:
# Sin LLM o ya en límite, solo truncar si es necesario
if current_tokens > self.max_tokens:
truncated = self.token_manager.truncate_to_tokens(chunk_text, self.max_tokens)
self._enhance_cache[cache_key] = truncated
return truncated
self._enhance_cache[cache_key] = chunk_text
return chunk_text
except Exception as e:
logger.error(f"Error procesando chunk: {e}")
if current_tokens > self.max_tokens:
truncated = self.token_manager.truncate_to_tokens(chunk_text, self.max_tokens)
self._enhance_cache[cache_key] = truncated
return truncated
self._enhance_cache[cache_key] = chunk_text
return chunk_text
def process_chunks_batch(
self,
chunks: List[Document],
merge_related: bool = False
) -> List[Document]:
"""
Procesa un lote de chunks, aplicando merge y mejoras.
Args:
chunks: Lista de documentos a procesar
merge_related: Si True, intenta unir chunks relacionados
Returns:
Lista de documentos procesados
"""
processed_chunks = []
total_chunks = len(chunks)
logger.info(f"Procesando {total_chunks} chunks en lotes de {self.chunks_per_batch}")
if self.custom_instructions:
logger.info(f"Con instrucciones personalizadas: {self.custom_instructions[:100]}...")
i = 0
while i < len(chunks):
batch_start = time.time()
current_chunk = chunks[i]
merged_content = current_chunk.page_content
# Intentar merge si está habilitado
if merge_related and i < len(chunks) - 1:
merge_count = 0
while (
i + merge_count < len(chunks) - 1 and
self.should_merge_chunks(
merged_content,
chunks[i + merge_count + 1].page_content
)
):
merge_count += 1
merged_content += "\n\n" + chunks[i + merge_count].page_content
logger.info(f" Uniendo chunk {i + 1} con chunk {i + merge_count + 1}")
i += merge_count
logger.info(f"\nProcesando chunk {i + 1}/{total_chunks}")
logger.info(f" Tokens originales: {original_tokens}")
# Mejorar chunk
enhanced_content = self.enhance_chunk(merged_content)
final_tokens = self.token_manager.count_tokens(enhanced_content)
processed_chunks.append(Document(
page_content=enhanced_content,
metadata={
**current_chunk.metadata,
}
))
logger.info(f" Tokens finales: {final_tokens}")
logger.info(f" Tiempo de procesamiento: {time.time() - batch_start:.2f}s")
i += 1
if i % self.chunks_per_batch == 0 and i < len(chunks):
logger.info(f"\nCompletados {i}/{total_chunks} chunks")
time.sleep(0.1)
return processed_chunks
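For reference, a minimal usage sketch of the processor without an LLM client, so merging falls back to the sentence-boundary heuristic above and enhancement only truncates; the sample texts and limits are illustrative only:

# Hedged usage sketch (illustrative; not part of the commit).
from langchain_core.documents import Document

processor = OptimizedChunkProcessor(
    max_tokens=950,
    target_tokens=800,
    gemini_client=None,  # no LLM: merge via heuristic, enhance only truncates
)
docs = [
    Document(page_content="Primera parte de una idea que continúa", metadata={"page": 1}),
    Document(page_content="y termina aquí.", metadata={"page": 1}),
]
result = processor.process_chunks_batch(docs, merge_related=True)
for d in result:
    print(processor.token_manager.count_tokens(d.page_content), d.metadata)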

View File

@@ -0,0 +1,91 @@
"""
Cliente para interactuar con Gemini (Google Vertex AI).
Usado para procesamiento inteligente de chunks con LLM.
"""
import logging
import os
import google.oauth2.service_account as sa
import vertexai.generative_models as gm
import vertexai
from ...core.config import settings
logger = logging.getLogger(__name__)
class GeminiClient:
"""Cliente para generar contenido usando Gemini via Vertex AI"""
def __init__(
self,
account_file: str | None = None,
project: str | None = None,
model: str | None = None
) -> None:
"""
Inicializa el cliente de Gemini.
Args:
account_file: Ruta al archivo de credenciales de servicio (default: desde settings)
project: ID del proyecto de Google Cloud (default: desde settings)
model: Modelo de Gemini a usar (default: desde settings)
"""
# Usar configuración de settings si no se proporciona
account_file = account_file or settings.GOOGLE_APPLICATION_CREDENTIALS
project = project or settings.GOOGLE_CLOUD_PROJECT
model = model or settings.GEMINI_MODEL
try:
# Cargar credenciales desde archivo
credentials = sa.Credentials.from_service_account_file(account_file)
# Inicializar Vertex AI
vertexai.init(
project=project,
credentials=credentials,
location=settings.GOOGLE_CLOUD_LOCATION
)
# Inicializar modelo
self.model = gm.GenerativeModel(model)
logger.info(f"GeminiClient inicializado con modelo {model}")
except Exception as e:
logger.error(f"Error inicializando GeminiClient: {e}")
raise
def generate_content(self, prompt: str) -> str:
"""
Genera contenido usando Gemini.
Args:
prompt: Prompt para el modelo
Returns:
Texto generado por el modelo
Raises:
Exception: Si hay error en la generación
"""
try:
response = self.model.generate_content(prompt)
return response.text
except Exception as e:
logger.error(f"Error en Gemini: {e}")
return ""
# Instancia global singleton
_gemini_client: GeminiClient | None = None
def get_gemini_client() -> GeminiClient:
"""
Obtiene la instancia singleton del cliente de Gemini.
Returns:
Instancia de GeminiClient
"""
global _gemini_client
if _gemini_client is None:
_gemini_client = GeminiClient()
return _gemini_client
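A minimal sketch of how the singleton is meant to be consumed; it assumes valid GOOGLE_APPLICATION_CREDENTIALS and GOOGLE_CLOUD_PROJECT values in settings, since GeminiClient() reads them from there:

# Hedged usage sketch (assumes valid Google Cloud credentials in settings).
client = get_gemini_client()  # lazily builds the singleton on first call
answer = client.generate_content("Responde SOLO 'SI' o 'NO': ¿2 + 2 = 4?")
if not answer:
    # generate_content swallows errors and returns "" (see above),
    # so callers must treat the empty string as a failure signal.
    print("Gemini devolvió vacío: tratar como fallo")
else:
    print(answer)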

View File

@@ -0,0 +1,299 @@
"""
Extractor optimizado de PDFs con soporte para BytesIO y procesamiento paralelo.
Adaptado para trabajar con Azure Blob Storage sin archivos temporales.
"""
import logging
import os
import time
import hashlib
from typing import List, Optional, Dict, BinaryIO
from io import BytesIO
from concurrent.futures import ThreadPoolExecutor
from langchain_core.documents import Document
from pypdf import PdfReader
from langchain_text_splitters import RecursiveCharacterTextSplitter
from pdf2image import convert_from_bytes
from .token_manager import TokenManager
from .chunk_processor import OptimizedChunkProcessor
from .gemini_client import GeminiClient
logger = logging.getLogger(__name__)
class OptimizedPDFExtractor:
"""Extractor optimizado de PDFs con soporte para BytesIO"""
def __init__(
self,
max_tokens: int = 1000,
target_tokens: int = 800,
gemini_client: Optional[GeminiClient] = None,
custom_instructions: str = "",
extract_images: bool = False, # Por defecto deshabilitado según requerimientos
max_workers: int = 4
):
"""
Inicializa el extractor de PDFs.
Args:
max_tokens: Límite máximo de tokens por chunk
target_tokens: Tokens objetivo para chunks
gemini_client: Cliente de Gemini (opcional)
custom_instructions: Instrucciones adicionales para optimización
extract_images: Si True, extrae páginas con formato especial como imágenes
max_workers: Número máximo de workers para procesamiento paralelo
"""
self.client = gemini_client
self.max_workers = max_workers
self.token_manager = TokenManager()
self.custom_instructions = custom_instructions
self.extract_images = extract_images
self._format_cache = {}
self.chunk_processor = OptimizedChunkProcessor(
max_tokens=max_tokens,
target_tokens=target_tokens,
gemini_client=gemini_client,
custom_instructions=custom_instructions
)
def detect_special_format_batch(self, chunks: List[Document]) -> Dict[int, bool]:
"""
Detecta chunks con formatos especiales (tablas, diagramas, etc.) en lote.
Args:
chunks: Lista de chunks a analizar
Returns:
Diccionario con índices de chunks y si tienen formato especial
"""
results = {}
chunks_to_process = []
for i, chunk in enumerate(chunks):
cache_key = hashlib.md5(chunk.page_content.encode()).hexdigest()[:16]
if cache_key in self._format_cache:
results[i] = self._format_cache[cache_key]
else:
chunks_to_process.append((i, chunk, cache_key))
if not chunks_to_process:
return results
logger.info(f"Analizando {len(chunks_to_process)} chunks para formatos especiales...")
if self.client and len(chunks_to_process) > 1:
with ThreadPoolExecutor(max_workers=min(self.max_workers, len(chunks_to_process))) as executor:
futures = {
executor.submit(self._detect_single_format, chunk): (i, cache_key)
for i, chunk, cache_key in chunks_to_process
}
for future in futures:
i, cache_key = futures[future]
try:
result = future.result()
results[i] = result
self._format_cache[cache_key] = result
except Exception as e:
logger.error(f"Error procesando chunk {i}: {e}")
results[i] = False
self._format_cache[cache_key] = False
else:
for i, chunk, cache_key in chunks_to_process:
result = self._detect_single_format(chunk)
results[i] = result
self._format_cache[cache_key] = result
return results
def _detect_single_format(self, chunk: Document) -> bool:
"""Detecta formato especial en un chunk individual."""
if not self.client:
content = chunk.page_content
# Caracteres típicos de tablas/diagramas (box-drawing, reconstruidos) y ASCII
table_indicators = ['│', '─', '┌', '┐', '└', '┘', '├', '┤', '|', '+']
has_table_chars = any(char in content for char in table_indicators)
# Tabulaciones o dobles espacios frecuentes sugieren texto en columnas
has_multiple_columns = content.count('\t') > 10 or content.count('  ') > 20
return has_table_chars or has_multiple_columns
try:
prompt = f"""¿Contiene este texto tablas estructuradas, diagramas ASCII, o elementos que requieren formato especial?
Responde SOLO 'SI' o 'NO'.
Texto:
{chunk.page_content[:1000]}"""
response = self.client.generate_content(prompt)
return response.strip().upper() == 'SI'
except Exception as e:
logger.error(f"Error detectando formato: {e}")
return False
def process_pdf_from_bytes(
self,
pdf_bytes: bytes,
file_name: str,
chunk_size: int = 1000,
chunk_overlap: int = 200,
merge_related: bool = True
) -> List[Document]:
"""
Procesa un PDF desde bytes (BytesIO).
Args:
pdf_bytes: Contenido del PDF en bytes
file_name: Nombre del archivo PDF
chunk_size: Tamaño del chunk
chunk_overlap: Solapamiento entre chunks
merge_related: Si True, intenta unir chunks relacionados
Returns:
Lista de documentos procesados
"""
overall_start = time.time()
logger.info(f"\n=== Iniciando procesamiento optimizado de PDF: {file_name} ===")
logger.info(f"Configuración:")
logger.info(f" - Tokens máximos por chunk: {self.chunk_processor.max_tokens}")
logger.info(f" - Tokens objetivo: {self.chunk_processor.target_tokens}")
logger.info(f" - Chunk size: {chunk_size}")
logger.info(f" - Chunk overlap: {chunk_overlap}")
logger.info(f" - Merge relacionados: {merge_related}")
logger.info(f" - Extraer imágenes: {'' if self.extract_images else ''}")
if self.custom_instructions:
logger.info(f" - Instrucciones personalizadas: {self.custom_instructions[:100]}...")
logger.info(f"\n1. Creando chunks del PDF...")
chunks = self._create_optimized_chunks_from_bytes(
pdf_bytes,
file_name,
chunk_size,
chunk_overlap
)
logger.info(f" Total chunks creados: {len(chunks)}")
# Nota: La extracción de imágenes desde bytes no se implementa por ahora
# ya que extract_images está deshabilitado por defecto según requerimientos
if self.extract_images:
logger.warning("Extracción de imágenes desde bytes no implementada aún")
logger.info(f"\n2. Procesando y optimizando chunks...")
processed_chunks = self.chunk_processor.process_chunks_batch(chunks, merge_related)
total_time = time.time() - overall_start
if processed_chunks:
avg_tokens = sum(
self.token_manager.count_tokens(chunk.page_content)
for chunk in processed_chunks
) / len(processed_chunks)
else:
avg_tokens = 0
logger.info(f"\n=== Procesamiento completado ===")
logger.info(f" Tiempo total: {total_time:.2f}s")
logger.info(f" Chunks procesados: {len(processed_chunks)}")
logger.info(f" Tokens promedio por chunk: {avg_tokens:.1f}")
if self.custom_instructions:
logger.info(f" Custom instructions aplicadas: ✅")
return processed_chunks
def _create_optimized_chunks_from_bytes(
self,
pdf_bytes: bytes,
file_name: str,
chunk_size: int,
chunk_overlap: int
) -> List[Document]:
"""
Crea chunks optimizados desde bytes del PDF.
Args:
pdf_bytes: Contenido del PDF en bytes
file_name: Nombre del archivo
chunk_size: Tamaño del chunk
chunk_overlap: Solapamiento entre chunks
Returns:
Lista de documentos con chunks
"""
logger.info(f" Leyendo PDF desde bytes: {file_name}")
# Crear BytesIO para pypdf
pdf_buffer = BytesIO(pdf_bytes)
pdf = PdfReader(pdf_buffer)
chunks = []
text_splitter = RecursiveCharacterTextSplitter(
chunk_size=chunk_size,
chunk_overlap=chunk_overlap,
length_function=self.token_manager.count_tokens,
separators=["\n\n", "\n", ". ", " ", ""]
)
# Extraer todo el texto concatenado con tracking de páginas
full_text = ""
page_boundaries = [] # Lista de (char_position, page_num)
for page_num, page in enumerate(pdf.pages, 1):
text = page.extract_text()
if text.strip():
page_start = len(full_text)
full_text += text
# Agregar separador entre páginas (excepto después de la última)
if page_num < len(pdf.pages):
full_text += "\n\n"
page_end = len(full_text)
page_boundaries.append((page_start, page_end, page_num))
if not full_text.strip():
return []
# Dividir el texto completo (esto permite overlap entre páginas)
text_chunks = text_splitter.split_text(full_text)
logger.info(f" Total de chunks generados por splitter: {len(text_chunks)}")
if len(text_chunks) >= 2:
# Verificar overlap entre primer y segundo chunk
chunk0_end = text_chunks[0][-100:] if len(text_chunks[0]) > 100 else text_chunks[0]
chunk1_start = text_chunks[1][:100] if len(text_chunks[1]) > 100 else text_chunks[1]
logger.info(f" Chunk 0 termina con: ...{chunk0_end}")
logger.info(f" Chunk 1 empieza con: {chunk1_start}...")
# Asignar página a cada chunk basándonos en su posición en el texto original
chunks = []
current_search_pos = 0
for chunk_text in text_chunks:
# Buscar donde aparece este chunk en el texto completo
chunk_pos = full_text.find(chunk_text, current_search_pos)
if chunk_pos == -1:
# Si no lo encontramos, usar la última posición conocida
chunk_pos = current_search_pos
# Determinar la página basándonos en la posición del inicio del chunk
chunk_page = 1
for start, end, page_num in page_boundaries:
if chunk_pos >= start and chunk_pos < end:
chunk_page = page_num
break
elif chunk_pos >= end:
# El chunk está después de esta página, continuar buscando
chunk_page = page_num # Guardar la última página vista
chunks.append(Document(
page_content=chunk_text,
metadata={
"page": chunk_page,
"file_name": file_name,
}
))
# Actualizar posición de búsqueda para el siguiente chunk
current_search_pos = chunk_pos + len(chunk_text)
return chunks
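The page attribution above relies on str.find over the concatenated text; a small self-contained sketch of the same idea, with toy boundaries rather than a real extractor:

# Hedged sketch of the page-attribution idea used in
# _create_optimized_chunks_from_bytes (toy data, same algorithm).
full_text = "Pagina uno.\n\nPagina dos con mas texto."
page_boundaries = [(0, 13, 1), (13, len(full_text), 2)]  # (start, end, page)

def page_for(chunk_text: str, search_from: int = 0) -> int:
    pos = full_text.find(chunk_text, search_from)
    if pos == -1:
        pos = search_from  # fall back to the last known position
    page = 1
    for start, end, num in page_boundaries:
        if start <= pos < end:
            return num
        if pos >= end:
            page = num  # remember the last page seen
    return page

assert page_for("Pagina dos") == 2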

View File

@@ -0,0 +1,65 @@
"""
Pipeline principal para procesar PDFs con control de tokens.
Función de alto nivel que orquesta el proceso completo de chunking.
"""
import logging
from typing import List, Optional
from langchain_core.documents import Document
from .pdf_extractor import OptimizedPDFExtractor
from .gemini_client import GeminiClient
logger = logging.getLogger(__name__)
def process_pdf_with_token_control(
pdf_bytes: bytes,
file_name: str,
max_tokens: int = 950,
target_tokens: int = 800,
chunk_size: int = 1000,
chunk_overlap: int = 200,
merge_related: bool = True,
gemini_client: Optional[GeminiClient] = None,
custom_instructions: str = "",
extract_images: bool = False
) -> List[Document]:
"""
Función principal para procesar PDFs con control completo de tokens.
Args:
pdf_bytes: Contenido del PDF en bytes
file_name: Nombre del archivo PDF
max_tokens: Límite máximo de tokens por chunk
target_tokens: Tokens objetivo para optimización
chunk_size: Tamaño base de chunks
chunk_overlap: Solapamiento entre chunks
merge_related: Si unir chunks relacionados
gemini_client: Cliente de Gemini (opcional, para LLM processing)
custom_instructions: Instrucciones adicionales para optimización
extract_images: Si True, extrae páginas con formato especial como imágenes
Returns:
Lista de documentos procesados con metadata simple (page, file_name)
"""
logger.info(f"Iniciando pipeline de chunking para {file_name}")
extractor = OptimizedPDFExtractor(
max_tokens=max_tokens,
target_tokens=target_tokens,
gemini_client=gemini_client,
custom_instructions=custom_instructions,
extract_images=extract_images,
max_workers=4
)
chunks = extractor.process_pdf_from_bytes(
pdf_bytes=pdf_bytes,
file_name=file_name,
chunk_size=chunk_size,
chunk_overlap=chunk_overlap,
merge_related=merge_related
)
logger.info(f"Pipeline completado: {len(chunks)} chunks generados")
return chunks
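An end-to-end sketch of the pipeline starting from a local file; the path is hypothetical and the LLM is disabled for simplicity:

# Hedged end-to-end sketch (hypothetical path; LLM disabled).
with open("docs/ejemplo.pdf", "rb") as f:
    pdf_bytes = f.read()

docs = process_pdf_with_token_control(
    pdf_bytes=pdf_bytes,
    file_name="ejemplo.pdf",
    max_tokens=950,
    target_tokens=800,
    gemini_client=None,  # or get_gemini_client() to enable LLM optimization
)
for d in docs[:3]:
    print(d.metadata["page"], len(d.page_content))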

View File

@@ -0,0 +1,72 @@
"""
Gestor de tokens para contar y truncar texto basado en modelos de tokenización.
"""
import logging
import tiktoken
logger = logging.getLogger(__name__)
class TokenManager:
"""Gestor para contar y truncar tokens usando tiktoken"""
def __init__(self, model_name: str = "gpt-3.5-turbo"):
"""
Inicializa el gestor de tokens.
Args:
model_name: Nombre del modelo para la codificación de tokens
"""
try:
self.encoding = tiktoken.encoding_for_model(model_name)
except KeyError:
logger.warning(
f"Modelo {model_name} no encontrado, usando codificación por defecto cl100k_base"
)
self.encoding = tiktoken.get_encoding("cl100k_base")
def count_tokens(self, text: str) -> int:
"""
Cuenta el número de tokens en un texto.
Args:
text: Texto a analizar
Returns:
Número de tokens
"""
return len(self.encoding.encode(text))
def truncate_to_tokens(
self,
text: str,
max_tokens: int,
preserve_sentences: bool = True
) -> str:
"""
Trunca texto a un número máximo de tokens.
Args:
text: Texto a truncar
max_tokens: Número máximo de tokens
preserve_sentences: Si True, intenta mantener oraciones completas
Returns:
Texto truncado
"""
tokens = self.encoding.encode(text)
if len(tokens) <= max_tokens:
return text
truncated_tokens = tokens[:max_tokens]
truncated_text = self.encoding.decode(truncated_tokens)
if preserve_sentences:
# Intentar cortar en el último punto
last_period = truncated_text.rfind('.')
# Solo cortar si el punto está en el último 30% del texto
if last_period > len(truncated_text) * 0.7:
return truncated_text[:last_period + 1]
return truncated_text
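A short sketch of both operations; the exact counts depend on the tokenizer, so the printed numbers are illustrative:

# Hedged usage sketch; exact token counts depend on the encoding.
tm = TokenManager()  # falls back to cl100k_base if the model is unknown
text = "Primera oración completa. Segunda oración que podría cortarse."
print(tm.count_tokens(text))

short = tm.truncate_to_tokens(text, max_tokens=8, preserve_sentences=True)
# With preserve_sentences=True the cut lands on the last '.' only if that
# period sits in the final 30% of the truncated text; otherwise a hard cut.
print(short)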

View File

@@ -0,0 +1,12 @@
"""
Vector Database Module
Este módulo proporciona una abstracción para trabajar con bases de datos vectoriales.
Utiliza el patrón Repository para permitir cambiar fácilmente entre diferentes
implementaciones (Qdrant, Pinecone, Weaviate, etc.).
"""
from .base import VectorDBBase
from .factory import get_vector_db
__all__ = ["VectorDBBase", "get_vector_db"]

View File

@@ -0,0 +1,189 @@
"""
Clase abstracta base para operaciones con bases de datos vectoriales.
Este módulo define la interfaz que todas las implementaciones de bases de datos
vectoriales deben seguir, permitiendo cambiar fácilmente entre diferentes proveedores.
"""
from abc import ABC, abstractmethod
from typing import List, Dict, Any, Optional
class VectorDBBase(ABC):
"""
Clase abstracta que define las operaciones básicas para una base de datos vectorial.
Esta interfaz permite implementar el patrón Repository/Strategy para
abstraer la lógica de acceso a datos vectoriales.
"""
@abstractmethod
async def collection_exists(self, collection_name: str) -> bool:
"""
Verifica si existe una colección con el nombre especificado.
Args:
collection_name: Nombre de la colección a verificar
Returns:
bool: True si la colección existe, False en caso contrario
"""
pass
@abstractmethod
async def create_collection(
self,
collection_name: str,
vector_size: int = 3072,
distance: str = "Cosine"
) -> bool:
"""
Crea una nueva colección en la base de datos vectorial.
Args:
collection_name: Nombre de la colección a crear
vector_size: Dimensión de los vectores (por defecto 3072)
distance: Métrica de distancia ("Cosine", "Euclid", "Dot")
Returns:
bool: True si se creó exitosamente, False en caso contrario
"""
pass
@abstractmethod
async def delete_collection(self, collection_name: str) -> bool:
"""
Elimina una colección completa.
Args:
collection_name: Nombre de la colección a eliminar
Returns:
bool: True si se eliminó exitosamente, False en caso contrario
"""
pass
@abstractmethod
async def file_exists_in_collection(
self,
collection_name: str,
file_name: str
) -> bool:
"""
Verifica si un archivo ya existe en una colección.
Args:
collection_name: Nombre de la colección
file_name: Nombre del archivo a buscar
Returns:
bool: True si el archivo existe, False en caso contrario
"""
pass
@abstractmethod
async def get_chunks_by_file(
self,
collection_name: str,
file_name: str,
limit: Optional[int] = None
) -> List[Dict[str, Any]]:
"""
Obtiene todos los chunks de un archivo específico.
Args:
collection_name: Nombre de la colección
file_name: Nombre del archivo
limit: Límite opcional de resultados
Returns:
List[Dict]: Lista de chunks con su metadata
"""
pass
@abstractmethod
async def delete_file_from_collection(
self,
collection_name: str,
file_name: str
) -> int:
"""
Elimina todos los chunks de un archivo de una colección.
Args:
collection_name: Nombre de la colección
file_name: Nombre del archivo a eliminar
Returns:
int: Número de chunks eliminados
"""
pass
@abstractmethod
async def add_chunks(
self,
collection_name: str,
chunks: List[Dict[str, Any]]
) -> Dict[str, Any]:
"""
Agrega múltiples chunks a una colección.
Args:
collection_name: Nombre de la colección
chunks: Lista de chunks con estructura:
{
"id": str,
"vector": List[float],
"payload": {
"text": str,
"file_name": str,
"page": int,
...otros campos opcionales
}
}
Returns:
Dict con 'success' (bool) y 'chunks_added' (int)
"""
pass
@abstractmethod
async def get_collection_info(self, collection_name: str) -> Optional[Dict[str, Any]]:
"""
Obtiene información sobre una colección.
Args:
collection_name: Nombre de la colección
Returns:
Optional[Dict]: Información de la colección o None si no existe
"""
pass
@abstractmethod
async def count_chunks_in_file(
self,
collection_name: str,
file_name: str
) -> int:
"""
Cuenta el número de chunks de un archivo.
Args:
collection_name: Nombre de la colección
file_name: Nombre del archivo
Returns:
int: Número de chunks del archivo
"""
pass
@abstractmethod
async def health_check(self) -> bool:
"""
Verifica que la conexión con la base de datos vectorial esté funcionando.
Returns:
bool: True si la conexión es exitosa, False en caso contrario
"""
pass
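Because consumers depend only on this interface, utilities can stay provider-agnostic; a minimal sketch of a helper written against the abstraction (the helper itself is a suggestion, not part of the commit):

# Hedged sketch: a helper coded against VectorDBBase, not a concrete client.
async def ensure_collection(db: VectorDBBase, name: str, vector_size: int = 3072) -> None:
    """Crea la colección solo si todavía no existe."""
    if not await db.collection_exists(name):
        created = await db.create_collection(name, vector_size=vector_size)
        if not created:
            raise RuntimeError(f"No se pudo crear la colección '{name}'")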

View File

@@ -0,0 +1,76 @@
"""
Factory para crear instancias de bases de datos vectoriales.
Este módulo implementa el patrón Factory para crear la instancia correcta
de base de datos vectorial según la configuración.
"""
import logging
from typing import Optional
from app.core.config import settings
from .base import VectorDBBase
from .qdrant_client import QdrantVectorDB
logger = logging.getLogger(__name__)
# Instancia global singleton
_vector_db_instance: Optional[VectorDBBase] = None
def get_vector_db() -> VectorDBBase:
"""
Factory function que retorna la instancia de base de datos vectorial configurada.
Utiliza un patrón Singleton para mantener una sola instancia durante
el ciclo de vida de la aplicación.
Returns:
VectorDBBase: Instancia de la base de datos vectorial configurada
Raises:
ValueError: Si el tipo de base de datos no está soportado
"""
global _vector_db_instance
# Si ya existe una instancia, retornarla
if _vector_db_instance is not None:
return _vector_db_instance
# Crear nueva instancia según configuración
db_type = settings.VECTOR_DB_TYPE.lower()
if db_type == "qdrant":
logger.info(f"Inicializando Qdrant con URL: {settings.QDRANT_URL}")
_vector_db_instance = QdrantVectorDB(
url=settings.QDRANT_URL,
api_key=settings.QDRANT_API_KEY
)
# Aquí se pueden agregar otros proveedores en el futuro
# elif db_type == "pinecone":
# _vector_db_instance = PineconeVectorDB(...)
# elif db_type == "weaviate":
# _vector_db_instance = WeaviateVectorDB(...)
else:
raise ValueError(
f"Tipo de base de datos vectorial no soportado: {db_type}. "
f"Tipos soportados: qdrant"
)
logger.info(f"Base de datos vectorial '{db_type}' inicializada exitosamente")
return _vector_db_instance
def reset_vector_db() -> None:
"""
Resetea la instancia global de la base de datos vectorial.
NOTA: Esta función solo descarta la referencia al cliente en memoria;
NO cierra conexiones explícitamente ni elimina/modifica datos en Qdrant.
Útil principalmente para testing.
"""
global _vector_db_instance
_vector_db_instance = None
logger.info("Instancia de base de datos vectorial reseteada")

View File

@@ -0,0 +1,410 @@
"""
Implementación de Qdrant para la interfaz VectorDBBase.
Este módulo proporciona la implementación concreta de todas las operaciones
vectoriales utilizando Qdrant como base de datos.
"""
import logging
from typing import List, Dict, Any, Optional
from qdrant_client import QdrantClient
from qdrant_client.models import (
Distance,
VectorParams,
PointStruct,
Filter,
FieldCondition,
MatchValue
)
from qdrant_client.http.exceptions import UnexpectedResponse
from .base import VectorDBBase
logger = logging.getLogger(__name__)
class QdrantVectorDB(VectorDBBase):
"""
Implementación de VectorDBBase usando Qdrant como proveedor.
Atributos:
client: Cliente de Qdrant
url: URL del servidor Qdrant
api_key: API key para autenticación
"""
def __init__(self, url: str, api_key: str):
"""
Inicializa el cliente de Qdrant.
Args:
url: URL del servidor Qdrant
api_key: API key para autenticación
"""
self.url = url
self.api_key = api_key
self.client = QdrantClient(
url=url,
api_key=api_key,
timeout=30
)
logger.info(f"QdrantVectorDB inicializado con URL: {url}")
async def collection_exists(self, collection_name: str) -> bool:
"""
Verifica si existe una colección en Qdrant.
Args:
collection_name: Nombre de la colección
Returns:
bool: True si existe, False en caso contrario
"""
try:
collections = self.client.get_collections().collections
return any(col.name == collection_name for col in collections)
except Exception as e:
logger.error(f"Error al verificar colección '{collection_name}': {e}")
return False
async def create_collection(
self,
collection_name: str,
vector_size: int = 3072,
distance: str = "Cosine"
) -> bool:
"""
Crea una nueva colección en Qdrant.
Args:
collection_name: Nombre de la colección
vector_size: Dimensión de los vectores (default: 3072)
distance: Métrica de distancia
Returns:
bool: True si se creó exitosamente
"""
try:
# Mapear string a enum de Qdrant
distance_map = {
"Cosine": Distance.COSINE,
"Euclid": Distance.EUCLID,
"Dot": Distance.DOT
}
distance_metric = distance_map.get(distance, Distance.COSINE)
self.client.create_collection(
collection_name=collection_name,
vectors_config=VectorParams(
size=vector_size,
distance=distance_metric
)
)
logger.info(f"Colección '{collection_name}' creada exitosamente")
return True
except Exception as e:
logger.error(f"Error al crear colección '{collection_name}': {e}")
return False
async def delete_collection(self, collection_name: str) -> bool:
"""
Elimina una colección completa de Qdrant.
Args:
collection_name: Nombre de la colección
Returns:
bool: True si se eliminó exitosamente
"""
try:
self.client.delete_collection(collection_name=collection_name)
logger.info(f"Colección '{collection_name}' eliminada exitosamente")
return True
except Exception as e:
logger.error(f"Error al eliminar colección '{collection_name}': {e}")
return False
async def file_exists_in_collection(
self,
collection_name: str,
file_name: str
) -> bool:
"""
Verifica si un archivo existe en una colección.
Args:
collection_name: Nombre de la colección
file_name: Nombre del archivo
Returns:
bool: True si el archivo existe
"""
try:
# Buscar un solo punto con el file_name en metadata
result = self.client.scroll(
collection_name=collection_name,
scroll_filter=Filter(
must=[
FieldCondition(
key="metadata.file_name",
match=MatchValue(value=file_name)
)
]
),
limit=1
)
return len(result[0]) > 0
except Exception as e:
logger.error(f"Error al verificar archivo '{file_name}' en colección '{collection_name}': {e}")
return False
async def get_chunks_by_file(
self,
collection_name: str,
file_name: str,
limit: Optional[int] = None
) -> List[Dict[str, Any]]:
"""
Obtiene todos los chunks de un archivo.
Args:
collection_name: Nombre de la colección
file_name: Nombre del archivo
limit: Límite opcional de resultados
Returns:
List[Dict]: Lista de chunks con metadata
"""
try:
chunks = []
offset = None
while True:
result = self.client.scroll(
collection_name=collection_name,
scroll_filter=Filter(
must=[
FieldCondition(
key="metadata.file_name",
match=MatchValue(value=file_name)
)
]
),
limit=min(limit, 100) if limit else 100,
offset=offset
)
points, next_offset = result
for point in points:
chunks.append({
"id": str(point.id),
"payload": point.payload,
"vector": point.vector if hasattr(point, 'vector') else None
})
# Si hay límite y lo alcanzamos, recortar el exceso y salir
if limit and len(chunks) >= limit:
    chunks = chunks[:limit]
    break
# Si no hay más resultados, salimos
if next_offset is None:
break
offset = next_offset
logger.info(f"Obtenidos {len(chunks)} chunks del archivo '{file_name}'")
return chunks
except Exception as e:
logger.error(f"Error al obtener chunks del archivo '{file_name}': {e}")
return []
async def delete_file_from_collection(
self,
collection_name: str,
file_name: str
) -> int:
"""
Elimina todos los chunks de un archivo.
Args:
collection_name: Nombre de la colección
file_name: Nombre del archivo
Returns:
int: Número de chunks eliminados
"""
try:
# Primero obtener todos los IDs del archivo
chunks = await self.get_chunks_by_file(collection_name, file_name)
if not chunks:
logger.info(f"No se encontraron chunks para el archivo '{file_name}'")
return 0
# Extraer los IDs
point_ids = [chunk["id"] for chunk in chunks]
# Eliminar por IDs
self.client.delete(
collection_name=collection_name,
points_selector=point_ids
)
logger.info(f"Eliminados {len(point_ids)} chunks del archivo '{file_name}'")
return len(point_ids)
except Exception as e:
logger.error(f"Error al eliminar archivo '{file_name}': {e}")
return 0
async def add_chunks(
self,
collection_name: str,
chunks: List[Dict[str, Any]]
) -> Dict[str, Any]:
"""
Agrega múltiples chunks a una colección.
Args:
collection_name: Nombre de la colección
chunks: Lista de chunks con estructura:
{
"id": str,
"vector": List[float],
"payload": {
"page_content": str,
"metadata": {
"file_name": str,
"page": int
}
}
}
Returns:
Dict con 'success' (bool) y 'chunks_added' (int)
"""
try:
points = []
for chunk in chunks:
point = PointStruct(
id=chunk["id"],
vector=chunk["vector"],
payload=chunk["payload"]
)
points.append(point)
self.client.upsert(
collection_name=collection_name,
points=points
)
logger.info(f"Agregados {len(points)} chunks a la colección '{collection_name}'")
return {
"success": True,
"chunks_added": len(points)
}
except Exception as e:
logger.error(f"Error al agregar chunks a '{collection_name}': {e}")
return {
"success": False,
"chunks_added": 0
}
async def get_collection_info(self, collection_name: str) -> Optional[Dict[str, Any]]:
"""
Obtiene información sobre una colección.
Args:
collection_name: Nombre de la colección
Returns:
Optional[Dict]: Información de la colección o None
"""
try:
collection_info = self.client.get_collection(collection_name=collection_name)
return {
"name": collection_name,
"vectors_count": collection_info.points_count,
"vectors_config": {
"size": collection_info.config.params.vectors.size,
"distance": collection_info.config.params.vectors.distance.name
},
"status": collection_info.status.name
}
except UnexpectedResponse as e:
if e.status_code == 404:
logger.warning(f"Colección '{collection_name}' no encontrada")
return None
logger.error(f"Error al obtener info de colección '{collection_name}': {e}")
return None
except Exception as e:
logger.error(f"Error inesperado al obtener info de colección '{collection_name}': {e}")
return None
async def count_chunks_in_file(
self,
collection_name: str,
file_name: str
) -> int:
"""
Cuenta el número de chunks de un archivo.
Args:
collection_name: Nombre de la colección
file_name: Nombre del archivo
Returns:
int: Número de chunks
"""
try:
# Usar la API de count de Qdrant con el mismo filtro que el resto de
# operaciones: la metadata vive bajo "metadata.file_name"
result = self.client.count(
collection_name=collection_name,
count_filter=Filter(
must=[
FieldCondition(
key="metadata.file_name",
match=MatchValue(value=file_name)
)
]
),
exact=True
)
count = result.count
logger.info(f"Archivo '{file_name}' tiene {count} chunks")
return count
except Exception as e:
logger.error(f"Error al contar chunks del archivo '{file_name}': {e}")
return 0
async def health_check(self) -> bool:
"""
Verifica la conexión con Qdrant.
Returns:
bool: True si la conexión es exitosa
"""
try:
self.client.get_collections()
logger.info("Health check de Qdrant exitoso")
return True
except Exception as e:
logger.error(f"Health check de Qdrant falló: {e}")
return False
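Putting the pieces together; the URL, API key and zero vector below are placeholders (real payloads carry 3072-dimension embeddings):

# Hedged end-to-end sketch with placeholder credentials and a dummy vector.
import asyncio
import uuid

async def demo() -> None:
    db = QdrantVectorDB(url="http://localhost:6333", api_key="changeme")
    if not await db.collection_exists("tema_demo"):
        await db.create_collection("tema_demo", vector_size=3072)
    result = await db.add_chunks("tema_demo", [{
        "id": str(uuid.uuid4()),
        "vector": [0.0] * 3072,  # placeholder; use real embeddings in practice
        "payload": {
            "page_content": "texto de ejemplo",
            "metadata": {"file_name": "ejemplo.pdf", "page": 1},
        },
    }])
    print(result, await db.count_chunks_in_file("tema_demo", "ejemplo.pdf"))

asyncio.run(demo())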

View File

@@ -12,6 +12,19 @@ dependencies = [
"python-multipart>=0.0.20", "python-multipart>=0.0.20",
"qdrant-client>=1.15.1", "qdrant-client>=1.15.1",
"uvicorn[standard]>=0.35.0", "uvicorn[standard]>=0.35.0",
# Chunking & PDF processing
"pypdf>=5.1.0",
"pdf2image>=1.17.0",
"pillow>=11.0.0",
# LLM & Embeddings
"openai>=1.59.6",
"google-cloud-aiplatform>=1.77.0",
"langchain>=0.3.12",
"langchain-core>=0.3.24",
"tiktoken>=0.8.0",
# WebSockets
"websockets>=14.1",
"langchain-text-splitters>=1.0.0",
] ]
[project.scripts] [project.scripts]
dev = "uvicorn app.main:app --host 0.0.0.0 --port 8000 --reload" dev = "uvicorn app.main:app --host 0.0.0.0 --port 8000 --reload"

1170
backend/uv.lock generated

File diff suppressed because it is too large

View File

@@ -11,7 +11,10 @@
"@radix-ui/react-checkbox": "^1.3.3", "@radix-ui/react-checkbox": "^1.3.3",
"@radix-ui/react-dialog": "^1.1.15", "@radix-ui/react-dialog": "^1.1.15",
"@radix-ui/react-label": "^2.1.7", "@radix-ui/react-label": "^2.1.7",
"@radix-ui/react-select": "^2.2.6",
"@radix-ui/react-slot": "^1.2.3", "@radix-ui/react-slot": "^1.2.3",
"@radix-ui/react-switch": "^1.2.6",
"@radix-ui/react-tabs": "^1.1.13",
"class-variance-authority": "^0.7.1", "class-variance-authority": "^0.7.1",
"clsx": "^2.1.1", "clsx": "^2.1.1",
"lucide-react": "^0.543.0", "lucide-react": "^0.543.0",
@@ -878,6 +881,44 @@
"node": "^18.18.0 || ^20.9.0 || >=21.1.0" "node": "^18.18.0 || ^20.9.0 || >=21.1.0"
} }
}, },
"node_modules/@floating-ui/core": {
"version": "1.7.3",
"resolved": "https://registry.npmjs.org/@floating-ui/core/-/core-1.7.3.tgz",
"integrity": "sha512-sGnvb5dmrJaKEZ+LDIpguvdX3bDlEllmv4/ClQ9awcmCZrlx5jQyyMWFM5kBI+EyNOCDDiKk8il0zeuX3Zlg/w==",
"license": "MIT",
"dependencies": {
"@floating-ui/utils": "^0.2.10"
}
},
"node_modules/@floating-ui/dom": {
"version": "1.7.4",
"resolved": "https://registry.npmjs.org/@floating-ui/dom/-/dom-1.7.4.tgz",
"integrity": "sha512-OOchDgh4F2CchOX94cRVqhvy7b3AFb+/rQXyswmzmGakRfkMgoWVjfnLWkRirfLEfuD4ysVW16eXzwt3jHIzKA==",
"license": "MIT",
"dependencies": {
"@floating-ui/core": "^1.7.3",
"@floating-ui/utils": "^0.2.10"
}
},
"node_modules/@floating-ui/react-dom": {
"version": "2.1.6",
"resolved": "https://registry.npmjs.org/@floating-ui/react-dom/-/react-dom-2.1.6.tgz",
"integrity": "sha512-4JX6rEatQEvlmgU80wZyq9RT96HZJa88q8hp0pBd+LrczeDI4o6uA2M+uvxngVHo4Ihr8uibXxH6+70zhAFrVw==",
"license": "MIT",
"dependencies": {
"@floating-ui/dom": "^1.7.4"
},
"peerDependencies": {
"react": ">=16.8.0",
"react-dom": ">=16.8.0"
}
},
"node_modules/@floating-ui/utils": {
"version": "0.2.10",
"resolved": "https://registry.npmjs.org/@floating-ui/utils/-/utils-0.2.10.tgz",
"integrity": "sha512-aGTxbpbg8/b5JfU1HXSrbH3wXZuLPJcNEcZQFMxLs3oSzgtVu6nFPkbbGGUvBcUjKV2YyB9Wxxabo+HEH9tcRQ==",
"license": "MIT"
},
"node_modules/@humanfs/core": { "node_modules/@humanfs/core": {
"version": "0.19.1", "version": "0.19.1",
"resolved": "https://registry.npmjs.org/@humanfs/core/-/core-0.19.1.tgz", "resolved": "https://registry.npmjs.org/@humanfs/core/-/core-0.19.1.tgz",
@@ -1204,12 +1245,41 @@
"node": ">= 8" "node": ">= 8"
} }
}, },
"node_modules/@radix-ui/number": {
"version": "1.1.1",
"resolved": "https://registry.npmjs.org/@radix-ui/number/-/number-1.1.1.tgz",
"integrity": "sha512-MkKCwxlXTgz6CFoJx3pCwn07GKp36+aZyu/u2Ln2VrA5DcdyCZkASEDBTd8x5whTQQL5CiYf4prXKLcgQdv29g==",
"license": "MIT"
},
"node_modules/@radix-ui/primitive": { "node_modules/@radix-ui/primitive": {
"version": "1.1.3", "version": "1.1.3",
"resolved": "https://registry.npmjs.org/@radix-ui/primitive/-/primitive-1.1.3.tgz", "resolved": "https://registry.npmjs.org/@radix-ui/primitive/-/primitive-1.1.3.tgz",
"integrity": "sha512-JTF99U/6XIjCBo0wqkU5sK10glYe27MRRsfwoiq5zzOEZLHU3A3KCMa5X/azekYRCJ0HlwI0crAXS/5dEHTzDg==", "integrity": "sha512-JTF99U/6XIjCBo0wqkU5sK10glYe27MRRsfwoiq5zzOEZLHU3A3KCMa5X/azekYRCJ0HlwI0crAXS/5dEHTzDg==",
"license": "MIT" "license": "MIT"
}, },
"node_modules/@radix-ui/react-arrow": {
"version": "1.1.7",
"resolved": "https://registry.npmjs.org/@radix-ui/react-arrow/-/react-arrow-1.1.7.tgz",
"integrity": "sha512-F+M1tLhO+mlQaOWspE8Wstg+z6PwxwRd8oQ8IXceWz92kfAmalTRf0EjrouQeo7QssEPfCn05B4Ihs1K9WQ/7w==",
"license": "MIT",
"dependencies": {
"@radix-ui/react-primitive": "2.1.3"
},
"peerDependencies": {
"@types/react": "*",
"@types/react-dom": "*",
"react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
"react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
},
"peerDependenciesMeta": {
"@types/react": {
"optional": true
},
"@types/react-dom": {
"optional": true
}
}
},
"node_modules/@radix-ui/react-checkbox": { "node_modules/@radix-ui/react-checkbox": {
"version": "1.3.3", "version": "1.3.3",
"resolved": "https://registry.npmjs.org/@radix-ui/react-checkbox/-/react-checkbox-1.3.3.tgz", "resolved": "https://registry.npmjs.org/@radix-ui/react-checkbox/-/react-checkbox-1.3.3.tgz",
@@ -1240,6 +1310,32 @@
} }
} }
}, },
"node_modules/@radix-ui/react-collection": {
"version": "1.1.7",
"resolved": "https://registry.npmjs.org/@radix-ui/react-collection/-/react-collection-1.1.7.tgz",
"integrity": "sha512-Fh9rGN0MoI4ZFUNyfFVNU4y9LUz93u9/0K+yLgA2bwRojxM8JU1DyvvMBabnZPBgMWREAJvU2jjVzq+LrFUglw==",
"license": "MIT",
"dependencies": {
"@radix-ui/react-compose-refs": "1.1.2",
"@radix-ui/react-context": "1.1.2",
"@radix-ui/react-primitive": "2.1.3",
"@radix-ui/react-slot": "1.2.3"
},
"peerDependencies": {
"@types/react": "*",
"@types/react-dom": "*",
"react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
"react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
},
"peerDependenciesMeta": {
"@types/react": {
"optional": true
},
"@types/react-dom": {
"optional": true
}
}
},
"node_modules/@radix-ui/react-compose-refs": { "node_modules/@radix-ui/react-compose-refs": {
"version": "1.1.2", "version": "1.1.2",
"resolved": "https://registry.npmjs.org/@radix-ui/react-compose-refs/-/react-compose-refs-1.1.2.tgz", "resolved": "https://registry.npmjs.org/@radix-ui/react-compose-refs/-/react-compose-refs-1.1.2.tgz",
@@ -1305,6 +1401,21 @@
} }
} }
}, },
"node_modules/@radix-ui/react-direction": {
"version": "1.1.1",
"resolved": "https://registry.npmjs.org/@radix-ui/react-direction/-/react-direction-1.1.1.tgz",
"integrity": "sha512-1UEWRX6jnOA2y4H5WczZ44gOOjTEmlqv1uNW4GAJEO5+bauCBhv8snY65Iw5/VOS/ghKN9gr2KjnLKxrsvoMVw==",
"license": "MIT",
"peerDependencies": {
"@types/react": "*",
"react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
},
"peerDependenciesMeta": {
"@types/react": {
"optional": true
}
}
},
"node_modules/@radix-ui/react-dismissable-layer": { "node_modules/@radix-ui/react-dismissable-layer": {
"version": "1.1.11", "version": "1.1.11",
"resolved": "https://registry.npmjs.org/@radix-ui/react-dismissable-layer/-/react-dismissable-layer-1.1.11.tgz", "resolved": "https://registry.npmjs.org/@radix-ui/react-dismissable-layer/-/react-dismissable-layer-1.1.11.tgz",
@@ -1413,6 +1524,38 @@
} }
} }
}, },
"node_modules/@radix-ui/react-popper": {
"version": "1.2.8",
"resolved": "https://registry.npmjs.org/@radix-ui/react-popper/-/react-popper-1.2.8.tgz",
"integrity": "sha512-0NJQ4LFFUuWkE7Oxf0htBKS6zLkkjBH+hM1uk7Ng705ReR8m/uelduy1DBo0PyBXPKVnBA6YBlU94MBGXrSBCw==",
"license": "MIT",
"dependencies": {
"@floating-ui/react-dom": "^2.0.0",
"@radix-ui/react-arrow": "1.1.7",
"@radix-ui/react-compose-refs": "1.1.2",
"@radix-ui/react-context": "1.1.2",
"@radix-ui/react-primitive": "2.1.3",
"@radix-ui/react-use-callback-ref": "1.1.1",
"@radix-ui/react-use-layout-effect": "1.1.1",
"@radix-ui/react-use-rect": "1.1.1",
"@radix-ui/react-use-size": "1.1.1",
"@radix-ui/rect": "1.1.1"
},
"peerDependencies": {
"@types/react": "*",
"@types/react-dom": "*",
"react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
"react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
},
"peerDependenciesMeta": {
"@types/react": {
"optional": true
},
"@types/react-dom": {
"optional": true
}
}
},
"node_modules/@radix-ui/react-portal": { "node_modules/@radix-ui/react-portal": {
"version": "1.1.9", "version": "1.1.9",
"resolved": "https://registry.npmjs.org/@radix-ui/react-portal/-/react-portal-1.1.9.tgz", "resolved": "https://registry.npmjs.org/@radix-ui/react-portal/-/react-portal-1.1.9.tgz",
@@ -1484,6 +1627,80 @@
} }
} }
}, },
"node_modules/@radix-ui/react-roving-focus": {
"version": "1.1.11",
"resolved": "https://registry.npmjs.org/@radix-ui/react-roving-focus/-/react-roving-focus-1.1.11.tgz",
"integrity": "sha512-7A6S9jSgm/S+7MdtNDSb+IU859vQqJ/QAtcYQcfFC6W8RS4IxIZDldLR0xqCFZ6DCyrQLjLPsxtTNch5jVA4lA==",
"license": "MIT",
"dependencies": {
"@radix-ui/primitive": "1.1.3",
"@radix-ui/react-collection": "1.1.7",
"@radix-ui/react-compose-refs": "1.1.2",
"@radix-ui/react-context": "1.1.2",
"@radix-ui/react-direction": "1.1.1",
"@radix-ui/react-id": "1.1.1",
"@radix-ui/react-primitive": "2.1.3",
"@radix-ui/react-use-callback-ref": "1.1.1",
"@radix-ui/react-use-controllable-state": "1.2.2"
},
"peerDependencies": {
"@types/react": "*",
"@types/react-dom": "*",
"react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
"react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
},
"peerDependenciesMeta": {
"@types/react": {
"optional": true
},
"@types/react-dom": {
"optional": true
}
}
},
"node_modules/@radix-ui/react-select": {
"version": "2.2.6",
"resolved": "https://registry.npmjs.org/@radix-ui/react-select/-/react-select-2.2.6.tgz",
"integrity": "sha512-I30RydO+bnn2PQztvo25tswPH+wFBjehVGtmagkU78yMdwTwVf12wnAOF+AeP8S2N8xD+5UPbGhkUfPyvT+mwQ==",
"license": "MIT",
"dependencies": {
"@radix-ui/number": "1.1.1",
"@radix-ui/primitive": "1.1.3",
"@radix-ui/react-collection": "1.1.7",
"@radix-ui/react-compose-refs": "1.1.2",
"@radix-ui/react-context": "1.1.2",
"@radix-ui/react-direction": "1.1.1",
"@radix-ui/react-dismissable-layer": "1.1.11",
"@radix-ui/react-focus-guards": "1.1.3",
"@radix-ui/react-focus-scope": "1.1.7",
"@radix-ui/react-id": "1.1.1",
"@radix-ui/react-popper": "1.2.8",
"@radix-ui/react-portal": "1.1.9",
"@radix-ui/react-primitive": "2.1.3",
"@radix-ui/react-slot": "1.2.3",
"@radix-ui/react-use-callback-ref": "1.1.1",
"@radix-ui/react-use-controllable-state": "1.2.2",
"@radix-ui/react-use-layout-effect": "1.1.1",
"@radix-ui/react-use-previous": "1.1.1",
"@radix-ui/react-visually-hidden": "1.2.3",
"aria-hidden": "^1.2.4",
"react-remove-scroll": "^2.6.3"
},
"peerDependencies": {
"@types/react": "*",
"@types/react-dom": "*",
"react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
"react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
},
"peerDependenciesMeta": {
"@types/react": {
"optional": true
},
"@types/react-dom": {
"optional": true
}
}
},
"node_modules/@radix-ui/react-slot": { "node_modules/@radix-ui/react-slot": {
"version": "1.2.3", "version": "1.2.3",
"resolved": "https://registry.npmjs.org/@radix-ui/react-slot/-/react-slot-1.2.3.tgz", "resolved": "https://registry.npmjs.org/@radix-ui/react-slot/-/react-slot-1.2.3.tgz",
@@ -1502,6 +1719,65 @@
} }
} }
}, },
"node_modules/@radix-ui/react-switch": {
"version": "1.2.6",
"resolved": "https://registry.npmjs.org/@radix-ui/react-switch/-/react-switch-1.2.6.tgz",
"integrity": "sha512-bByzr1+ep1zk4VubeEVViV592vu2lHE2BZY5OnzehZqOOgogN80+mNtCqPkhn2gklJqOpxWgPoYTSnhBCqpOXQ==",
"license": "MIT",
"dependencies": {
"@radix-ui/primitive": "1.1.3",
"@radix-ui/react-compose-refs": "1.1.2",
"@radix-ui/react-context": "1.1.2",
"@radix-ui/react-primitive": "2.1.3",
"@radix-ui/react-use-controllable-state": "1.2.2",
"@radix-ui/react-use-previous": "1.1.1",
"@radix-ui/react-use-size": "1.1.1"
},
"peerDependencies": {
"@types/react": "*",
"@types/react-dom": "*",
"react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
"react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
},
"peerDependenciesMeta": {
"@types/react": {
"optional": true
},
"@types/react-dom": {
"optional": true
}
}
},
"node_modules/@radix-ui/react-tabs": {
"version": "1.1.13",
"resolved": "https://registry.npmjs.org/@radix-ui/react-tabs/-/react-tabs-1.1.13.tgz",
"integrity": "sha512-7xdcatg7/U+7+Udyoj2zodtI9H/IIopqo+YOIcZOq1nJwXWBZ9p8xiu5llXlekDbZkca79a/fozEYQXIA4sW6A==",
"license": "MIT",
"dependencies": {
"@radix-ui/primitive": "1.1.3",
"@radix-ui/react-context": "1.1.2",
"@radix-ui/react-direction": "1.1.1",
"@radix-ui/react-id": "1.1.1",
"@radix-ui/react-presence": "1.1.5",
"@radix-ui/react-primitive": "2.1.3",
"@radix-ui/react-roving-focus": "1.1.11",
"@radix-ui/react-use-controllable-state": "1.2.2"
},
"peerDependencies": {
"@types/react": "*",
"@types/react-dom": "*",
"react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
"react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
},
"peerDependenciesMeta": {
"@types/react": {
"optional": true
},
"@types/react-dom": {
"optional": true
}
}
},
"node_modules/@radix-ui/react-use-callback-ref": { "node_modules/@radix-ui/react-use-callback-ref": {
"version": "1.1.1", "version": "1.1.1",
"resolved": "https://registry.npmjs.org/@radix-ui/react-use-callback-ref/-/react-use-callback-ref-1.1.1.tgz", "resolved": "https://registry.npmjs.org/@radix-ui/react-use-callback-ref/-/react-use-callback-ref-1.1.1.tgz",
@@ -1602,6 +1878,24 @@
} }
} }
}, },
"node_modules/@radix-ui/react-use-rect": {
"version": "1.1.1",
"resolved": "https://registry.npmjs.org/@radix-ui/react-use-rect/-/react-use-rect-1.1.1.tgz",
"integrity": "sha512-QTYuDesS0VtuHNNvMh+CjlKJ4LJickCMUAqjlE3+j8w+RlRpwyX3apEQKGFzbZGdo7XNG1tXa+bQqIE7HIXT2w==",
"license": "MIT",
"dependencies": {
"@radix-ui/rect": "1.1.1"
},
"peerDependencies": {
"@types/react": "*",
"react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
},
"peerDependenciesMeta": {
"@types/react": {
"optional": true
}
}
},
"node_modules/@radix-ui/react-use-size": { "node_modules/@radix-ui/react-use-size": {
"version": "1.1.1", "version": "1.1.1",
"resolved": "https://registry.npmjs.org/@radix-ui/react-use-size/-/react-use-size-1.1.1.tgz", "resolved": "https://registry.npmjs.org/@radix-ui/react-use-size/-/react-use-size-1.1.1.tgz",
@@ -1620,6 +1914,35 @@
} }
} }
}, },
"node_modules/@radix-ui/react-visually-hidden": {
"version": "1.2.3",
"resolved": "https://registry.npmjs.org/@radix-ui/react-visually-hidden/-/react-visually-hidden-1.2.3.tgz",
"integrity": "sha512-pzJq12tEaaIhqjbzpCuv/OypJY/BPavOofm+dbab+MHLajy277+1lLm6JFcGgF5eskJ6mquGirhXY2GD/8u8Ug==",
"license": "MIT",
"dependencies": {
"@radix-ui/react-primitive": "2.1.3"
},
"peerDependencies": {
"@types/react": "*",
"@types/react-dom": "*",
"react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc",
"react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc"
},
"peerDependenciesMeta": {
"@types/react": {
"optional": true
},
"@types/react-dom": {
"optional": true
}
}
},
"node_modules/@radix-ui/rect": {
"version": "1.1.1",
"resolved": "https://registry.npmjs.org/@radix-ui/rect/-/rect-1.1.1.tgz",
"integrity": "sha512-HPwpGIzkl28mWyZqG52jiqDJ12waP11Pa1lGoiyUkIEuMLBP0oeK/C89esbXrxsky5we7dfd8U58nm0SgAWpVw==",
"license": "MIT"
},
"node_modules/@rolldown/pluginutils": { "node_modules/@rolldown/pluginutils": {
"version": "1.0.0-beta.34", "version": "1.0.0-beta.34",
"resolved": "https://registry.npmjs.org/@rolldown/pluginutils/-/pluginutils-1.0.0-beta.34.tgz", "resolved": "https://registry.npmjs.org/@rolldown/pluginutils/-/pluginutils-1.0.0-beta.34.tgz",

View File

@@ -13,7 +13,10 @@
"@radix-ui/react-checkbox": "^1.3.3", "@radix-ui/react-checkbox": "^1.3.3",
"@radix-ui/react-dialog": "^1.1.15", "@radix-ui/react-dialog": "^1.1.15",
"@radix-ui/react-label": "^2.1.7", "@radix-ui/react-label": "^2.1.7",
"@radix-ui/react-select": "^2.2.6",
"@radix-ui/react-slot": "^1.2.3", "@radix-ui/react-slot": "^1.2.3",
"@radix-ui/react-switch": "^1.2.6",
"@radix-ui/react-tabs": "^1.1.13",
"class-variance-authority": "^0.7.1", "class-variance-authority": "^0.7.1",
"clsx": "^2.1.1", "clsx": "^2.1.1",
"lucide-react": "^0.543.0", "lucide-react": "^0.543.0",

View File

@@ -0,0 +1,228 @@
import { useState, useEffect } from 'react'
import { api } from '../services/api'
import {
Dialog,
DialogContent,
DialogDescription,
DialogFooter,
DialogHeader,
DialogTitle,
} from './ui/dialog'
import { Button } from './ui/button'
import { AlertCircle, Loader2, FileText, CheckCircle2, XCircle } from 'lucide-react'
import type { ChunkingConfig } from './ChunkingConfigModal'
interface ChunkPreviewPanelProps {
isOpen: boolean
onClose: () => void
config: ChunkingConfig | null
onAccept: (config: ChunkingConfig) => void
onCancel: () => void
}
interface PreviewChunk {
index: number
text: string
page: number
file_name: string
tokens: number
}
export function ChunkPreviewPanel({
isOpen,
onClose,
config,
onAccept,
onCancel,
}: ChunkPreviewPanelProps) {
const [chunks, setChunks] = useState<PreviewChunk[]>([])
const [loading, setLoading] = useState(false)
const [processing, setProcessing] = useState(false)
const [error, setError] = useState<string | null>(null)
const [success, setSuccess] = useState(false)
// Auto-cargar preview cuando se abre el modal
useEffect(() => {
if (isOpen && config && chunks.length === 0) {
loadPreview()
}
}, [isOpen, config])
const loadPreview = async () => {
if (!config) return
setLoading(true)
setError(null)
setSuccess(false)
try {
const result = await api.generateChunkPreview(config)
setChunks(result.chunks)
} catch (err) {
console.error('Error loading preview:', err)
setError(err instanceof Error ? err.message : 'Error generando preview')
} finally {
setLoading(false)
}
}
const handleAccept = async () => {
if (!config) return
setProcessing(true)
setError(null)
try {
await onAccept(config)
setSuccess(true)
// Cerrar después de 2 segundos
setTimeout(() => {
handleClose()
}, 2000)
} catch (err) {
console.error('Error processing:', err)
setError(err instanceof Error ? err.message : 'Error procesando PDF')
} finally {
setProcessing(false)
}
}
const handleCancel = () => {
onCancel()
handleClose()
}
const handleClose = () => {
setChunks([])
setError(null)
setSuccess(false)
onClose()
}
if (!config) return null
return (
<Dialog open={isOpen} onOpenChange={handleClose}>
<DialogContent className="max-w-4xl max-h-[85vh] flex flex-col">
<DialogHeader>
<DialogTitle className="flex items-center gap-2">
<FileText className="w-5 h-5" />
Preview de Chunks
</DialogTitle>
<DialogDescription>
Vista previa de chunks para <strong>{config.file_name}</strong>
</DialogDescription>
</DialogHeader>
{/* Contenido */}
<div className="flex-1 overflow-y-auto">
{loading ? (
<div className="flex items-center justify-center py-12">
<Loader2 className="w-8 h-8 animate-spin text-gray-400" />
<span className="ml-2 text-gray-500">Generando preview...</span>
</div>
) : error ? (
<div className="flex items-center gap-2 text-sm text-red-600 bg-red-50 p-4 rounded">
<AlertCircle className="w-5 h-5" />
<span>{error}</span>
</div>
) : success ? (
<div className="flex flex-col items-center justify-center py-12 text-center">
<CheckCircle2 className="w-16 h-16 text-green-500 mb-4" />
<h3 className="text-lg font-semibold text-green-700">
Procesamiento Completado
</h3>
<p className="text-sm text-gray-600 mt-2">
El PDF ha sido procesado y subido a Qdrant exitosamente
</p>
</div>
) : chunks.length === 0 ? (
<div className="text-center py-12 text-gray-500">
<FileText className="w-12 h-12 mx-auto mb-2 text-gray-300" />
<p>No hay chunks para mostrar</p>
</div>
) : (
<div className="space-y-4">
{/* Información de configuración */}
<div className="bg-blue-50 p-3 rounded">
<p className="text-sm text-blue-800">
<strong>Configuración:</strong> Max {config.max_tokens} tokens, Target{' '}
{config.target_tokens} tokens
{config.use_llm && ' | LLM Habilitado'}
</p>
</div>
{/* Lista de chunks */}
{chunks.map((chunk) => (
<div key={chunk.index} className="border rounded-lg p-4 space-y-2">
{/* Header del chunk */}
<div className="flex items-start justify-between">
<div className="flex items-center gap-2">
<span className="text-sm font-semibold text-gray-700">
Chunk #{chunk.index + 1}
</span>
<span className="text-xs text-gray-500 bg-gray-100 px-2 py-1 rounded">
Página {chunk.page}
</span>
<span className="text-xs text-blue-600 bg-blue-100 px-2 py-1 rounded">
~{chunk.tokens} tokens
</span>
</div>
</div>
{/* Texto del chunk */}
<div className="bg-gray-50 p-3 rounded text-sm">
<p className="text-gray-700 whitespace-pre-wrap leading-relaxed">
{chunk.text}
</p>
</div>
{/* Indicador de longitud */}
<div className="text-xs text-gray-500">
Longitud: {chunk.text.length} caracteres
</div>
</div>
))}
{/* Información adicional */}
<div className="bg-yellow-50 border border-yellow-200 p-3 rounded">
<p className="text-sm text-yellow-800">
<strong>Nota:</strong> Estos son chunks de ejemplo (hasta 3). El documento
completo generará más chunks según su tamaño.
</p>
</div>
</div>
)}
</div>
{/* Footer con acciones */}
<DialogFooter className="flex justify-between items-center pt-4 border-t">
<Button
variant="outline"
onClick={handleCancel}
disabled={processing || success}
className="text-red-600 hover:text-red-700 hover:bg-red-50"
>
<XCircle className="w-4 h-4 mr-2" />
Cancelar
</Button>
<Button onClick={handleAccept} disabled={processing || loading || chunks.length === 0 || success}>
{processing ? (
<>
<Loader2 className="w-4 h-4 mr-2 animate-spin" />
Procesando...
</>
) : (
<>
<CheckCircle2 className="w-4 h-4 mr-2" />
Aceptar y Procesar
</>
)}
</Button>
</DialogFooter>
</DialogContent>
</Dialog>
)
}

View File

@@ -0,0 +1,205 @@
import { useEffect, useState } from 'react'
import { api } from '../services/api'
import {
Dialog,
DialogContent,
DialogDescription,
DialogHeader,
DialogTitle,
} from './ui/dialog'
import { Button } from './ui/button'
import { AlertCircle, Loader2, FileText, Trash2 } from 'lucide-react'
interface ChunkViewerModalProps {
isOpen: boolean
onClose: () => void
fileName: string
tema: string
}
interface Chunk {
id: string
payload: {
page_content: string
metadata: {
file_name: string
page: number
[key: string]: any
}
[key: string]: any
}
vector?: number[]
}
export function ChunkViewerModal({ isOpen, onClose, fileName, tema }: ChunkViewerModalProps) {
const [chunks, setChunks] = useState<Chunk[]>([])
const [loading, setLoading] = useState(false)
const [error, setError] = useState<string | null>(null)
const [deleting, setDeleting] = useState(false)
useEffect(() => {
if (isOpen && fileName && tema) {
loadChunks()
}
}, [isOpen, fileName, tema])
const loadChunks = async () => {
setLoading(true)
setError(null)
try {
const result = await api.getChunksByFile(tema, fileName)
setChunks(result.chunks)
} catch (err) {
console.error('Error loading chunks:', err)
setError(err instanceof Error ? err.message : 'Error al cargar chunks')
} finally {
setLoading(false)
}
}
const handleDeleteFile = async () => {
if (!confirm(`¿Estás seguro de eliminar todos los chunks del archivo "${fileName}" de la colección "${tema}"?`)) {
return
}
setDeleting(true)
setError(null)
try {
await api.deleteFileFromCollection(tema, fileName)
alert('Archivo eliminado de la colección exitosamente')
onClose()
} catch (err) {
console.error('Error deleting file from collection:', err)
setError(err instanceof Error ? err.message : 'Error al eliminar archivo')
} finally {
setDeleting(false)
}
}
const handleClose = () => {
setChunks([])
setError(null)
onClose()
}
return (
<Dialog open={isOpen} onOpenChange={handleClose}>
<DialogContent className="max-w-4xl max-h-[80vh] flex flex-col">
<DialogHeader>
<DialogTitle className="flex items-center gap-2">
<FileText className="w-5 h-5" />
Chunks de "{fileName}"
</DialogTitle>
<DialogDescription>
Colección: <strong>{tema}</strong>
</DialogDescription>
</DialogHeader>
{/* Contenido */}
<div className="flex-1 overflow-y-auto">
{loading ? (
<div className="flex items-center justify-center py-8">
<Loader2 className="w-8 h-8 animate-spin text-gray-400" />
<span className="ml-2 text-gray-500">Cargando chunks...</span>
</div>
) : error ? (
<div className="flex items-center gap-2 text-sm text-red-600 bg-red-50 p-4 rounded">
<AlertCircle className="w-5 h-5" />
<span>{error}</span>
</div>
) : chunks.length === 0 ? (
<div className="text-center py-8 text-gray-500">
<FileText className="w-12 h-12 mx-auto mb-2 text-gray-300" />
<p>No se encontraron chunks para este archivo.</p>
<p className="text-sm mt-1">El archivo aún no ha sido procesado o no existe en la colección.</p>
</div>
) : (
<div className="space-y-4">
{/* Estadísticas */}
<div className="bg-blue-50 p-3 rounded">
<p className="text-sm text-blue-800">
<strong>Total de chunks:</strong> {chunks.length}
</p>
</div>
{/* Lista de chunks */}
{chunks.map((chunk, index) => (
<div key={chunk.id} className="border rounded-lg p-4 space-y-2">
{/* Header del chunk */}
<div className="flex items-start justify-between">
<div className="flex items-center gap-2">
<span className="text-sm font-semibold text-gray-700">
Chunk #{index + 1}
</span>
<span className="text-xs text-gray-500">
Página {chunk.payload.metadata.page}
</span>
</div>
<span className="text-xs text-gray-400 font-mono">
ID: {chunk.id.substring(0, 8)}...
</span>
</div>
{/* Chunk text */}
{chunk.payload.page_content && (
<div className="bg-gray-50 p-3 rounded text-sm">
<p className="text-gray-700 whitespace-pre-wrap">
{chunk.payload.page_content}
</p>
<div className="mt-2 text-xs text-gray-500">
<strong>Caracteres:</strong> {chunk.payload.page_content.length}
</div>
</div>
)}
{/* Metadata */}
<div className="text-xs text-gray-500">
<strong>Metadata:</strong>
<pre className="mt-1 bg-gray-100 p-2 rounded overflow-x-auto">
{JSON.stringify(chunk.payload.metadata, null, 2)}
</pre>
</div>
{/* Vector info (optional) */}
{chunk.vector && (
<div className="text-xs text-gray-400">
Vector dimension: {chunk.vector.length}
</div>
)}
</div>
))}
</div>
)}
</div>
{/* Footer with actions */}
<div className="flex justify-between items-center pt-4 border-t">
<Button
variant="outline"
onClick={handleDeleteFile}
disabled={deleting || chunks.length === 0}
className="text-red-600 hover:text-red-700 hover:bg-red-50"
>
{deleting ? (
<>
<Loader2 className="w-4 h-4 mr-2 animate-spin" />
Eliminando...
</>
) : (
<>
<Trash2 className="w-4 h-4 mr-2" />
Eliminar de colección
</>
)}
</Button>
<Button onClick={handleClose}>
Cerrar
</Button>
</div>
</DialogContent>
</Dialog>
)
}


@@ -0,0 +1,307 @@
import { useEffect, useState } from 'react'
import { api } from '../services/api'
import {
Dialog,
DialogContent,
DialogDescription,
DialogFooter,
DialogHeader,
DialogTitle,
} from './ui/dialog'
import { Button } from './ui/button'
import { Label } from './ui/label'
import { Input } from './ui/input'
import { Textarea } from './ui/textarea'
import { Select, SelectContent, SelectItem, SelectTrigger, SelectValue } from './ui/select'
import { Switch } from './ui/switch'
import { AlertCircle, Loader2, Settings, Sparkles } from 'lucide-react'
import { Tabs, TabsContent, TabsList, TabsTrigger } from './ui/tabs'
interface ChunkingConfigModalProps {
isOpen: boolean
onClose: () => void
fileName: string
tema: string
collectionName: string
onPreview: (config: ChunkingConfig) => void
}
export interface ChunkingConfig {
file_name: string
tema: string
collection_name: string
max_tokens: number
target_tokens: number
chunk_size: number
chunk_overlap: number
use_llm: boolean
custom_instructions: string
}
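// A hypothetical ChunkingConfig for reference; the numeric values mirror the
// defaults used below, while file_name/tema/collection_name are illustrative:
const exampleChunkingConfig: ChunkingConfig = {
  file_name: 'manual.pdf',
  tema: 'soporte',
  collection_name: 'soporte',
  max_tokens: 950,
  target_tokens: 800,
  chunk_size: 1000,
  chunk_overlap: 200,
  use_llm: true,
  custom_instructions: '',
}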
interface ChunkingProfile {
id: string
name: string
description: string
max_tokens: number
target_tokens: number
chunk_size: number
chunk_overlap: number
use_llm: boolean
}
export function ChunkingConfigModal({
isOpen,
onClose,
fileName,
tema,
collectionName,
onPreview,
}: ChunkingConfigModalProps) {
const [profiles, setProfiles] = useState<ChunkingProfile[]>([])
const [selectedProfile, setSelectedProfile] = useState<string>('balanced')
const [loading, setLoading] = useState(false)
const [error, setError] = useState<string | null>(null)
// Custom configuration
const [maxTokens, setMaxTokens] = useState(950)
const [targetTokens, setTargetTokens] = useState(800)
const [chunkSize, setChunkSize] = useState(1000)
const [chunkOverlap, setChunkOverlap] = useState(200)
const [useLLM, setUseLLM] = useState(true)
const [customInstructions, setCustomInstructions] = useState('')
useEffect(() => {
if (isOpen) {
loadProfiles()
}
}, [isOpen])
const loadProfiles = async () => {
setLoading(true)
setError(null)
try {
const result = await api.getChunkingProfiles()
setProfiles(result.profiles)
} catch (err) {
console.error('Error loading profiles:', err)
setError(err instanceof Error ? err.message : 'Error cargando perfiles')
} finally {
setLoading(false)
}
}
const handleProfileChange = (profileId: string) => {
setSelectedProfile(profileId)
const profile = profiles.find((p) => p.id === profileId)
if (profile) {
setMaxTokens(profile.max_tokens)
setTargetTokens(profile.target_tokens)
setChunkSize(profile.chunk_size)
setChunkOverlap(profile.chunk_overlap)
setUseLLM(profile.use_llm)
}
}
const handlePreview = () => {
const config: ChunkingConfig = {
file_name: fileName,
tema: tema,
collection_name: collectionName,
max_tokens: maxTokens,
target_tokens: targetTokens,
chunk_size: chunkSize,
chunk_overlap: chunkOverlap,
use_llm: useLLM,
custom_instructions: useLLM ? customInstructions : '',
}
onPreview(config)
}
const handleClose = () => {
setError(null)
onClose()
}
return (
<Dialog open={isOpen} onOpenChange={handleClose}>
<DialogContent className="max-w-2xl max-h-[90vh] flex flex-col">
<DialogHeader>
<DialogTitle className="flex items-center gap-2">
<Settings className="w-5 h-5" />
Configurar Chunking
</DialogTitle>
<DialogDescription>
Configura cómo se procesará el archivo <strong>{fileName}</strong>
</DialogDescription>
</DialogHeader>
{loading ? (
<div className="flex items-center justify-center py-8">
<Loader2 className="w-8 h-8 animate-spin text-gray-400" />
<span className="ml-2 text-gray-500">Cargando perfiles...</span>
</div>
) : error ? (
<div className="flex items-center gap-2 text-sm text-red-600 bg-red-50 p-4 rounded">
<AlertCircle className="w-5 h-5" />
<span>{error}</span>
</div>
) : (
<Tabs defaultValue="profiles" className="flex-1">
<TabsList className="grid w-full grid-cols-2">
<TabsTrigger value="profiles">Perfiles</TabsTrigger>
<TabsTrigger value="custom">Personalizado</TabsTrigger>
</TabsList>
{/* Profiles tab */}
<TabsContent value="profiles" className="space-y-4">
<div className="space-y-2">
<Label>Perfil de Configuración</Label>
<Select value={selectedProfile} onValueChange={handleProfileChange}>
<SelectTrigger>
<SelectValue placeholder="Selecciona un perfil" />
</SelectTrigger>
<SelectContent>
{profiles.map((profile) => (
<SelectItem key={profile.id} value={profile.id}>
<div className="flex flex-col">
<span className="font-medium">{profile.name}</span>
<span className="text-xs text-gray-500">{profile.description}</span>
</div>
</SelectItem>
))}
</SelectContent>
</Select>
</div>
{/* Show details of the selected profile */}
{selectedProfile && (
<div className="bg-gray-50 p-4 rounded-lg space-y-2 text-sm">
<div className="grid grid-cols-2 gap-2">
<div>
<span className="font-medium">Max Tokens:</span> {maxTokens}
</div>
<div>
<span className="font-medium">Target Tokens:</span> {targetTokens}
</div>
<div>
<span className="font-medium">Chunk Size:</span> {chunkSize}
</div>
<div>
<span className="font-medium">Overlap:</span> {chunkOverlap}
</div>
<div className="col-span-2">
<span className="font-medium">LLM:</span>{' '}
{useLLM ? '✅ Habilitado' : '❌ Deshabilitado'}
</div>
</div>
</div>
)}
</TabsContent>
{/* Custom tab */}
<TabsContent value="custom" className="space-y-4 overflow-y-auto max-h-[50vh]">
<div className="grid grid-cols-2 gap-4">
<div className="space-y-2">
<Label htmlFor="maxTokens">Max Tokens</Label>
<Input
id="maxTokens"
type="number"
min={100}
max={2000}
value={maxTokens}
onChange={(e) => setMaxTokens(Number(e.target.value))}
/>
</div>
<div className="space-y-2">
<Label htmlFor="targetTokens">Target Tokens</Label>
<Input
id="targetTokens"
type="number"
min={100}
max={2000}
value={targetTokens}
onChange={(e) => setTargetTokens(Number(e.target.value))}
/>
</div>
<div className="space-y-2">
<Label htmlFor="chunkSize">Chunk Size</Label>
<Input
id="chunkSize"
type="number"
min={100}
max={3000}
value={chunkSize}
onChange={(e) => setChunkSize(Number(e.target.value))}
/>
</div>
<div className="space-y-2">
<Label htmlFor="chunkOverlap">Chunk Overlap</Label>
<Input
id="chunkOverlap"
type="number"
min={0}
max={1000}
value={chunkOverlap}
onChange={(e) => setChunkOverlap(Number(e.target.value))}
/>
</div>
</div>
{/* Toggle LLM */}
<div className="flex items-center justify-between p-4 bg-blue-50 rounded-lg">
<div className="flex items-center gap-2">
<Sparkles className="w-5 h-5 text-blue-600" />
<div>
<Label htmlFor="useLLM" className="font-medium cursor-pointer">
Usar LLM (Gemini)
</Label>
<p className="text-xs text-gray-600">
Procesamiento inteligente con IA
</p>
</div>
</div>
<Switch
id="useLLM"
checked={useLLM}
onCheckedChange={setUseLLM}
/>
</div>
{/* Custom instructions (only when LLM is enabled) */}
{useLLM && (
<div className="space-y-2">
<Label htmlFor="customInstructions">
Instrucciones Personalizadas (Opcional)
</Label>
<Textarea
id="customInstructions"
placeholder="Ej: Mantén todos los términos técnicos en inglés..."
value={customInstructions}
onChange={(e) => setCustomInstructions(e.target.value)}
rows={3}
/>
<p className="text-xs text-gray-500">
Instrucciones adicionales para guiar el procesamiento con IA
</p>
</div>
)}
</TabsContent>
</Tabs>
)}
<DialogFooter className="flex justify-between items-center pt-4 border-t">
<Button variant="outline" onClick={handleClose}>
Cancelar
</Button>
<Button onClick={handlePreview} disabled={loading}>
Generar Preview
</Button>
</DialogFooter>
</DialogContent>
</Dialog>
)
}

View File

@@ -0,0 +1,164 @@
import { useEffect, useState } from 'react'
import { api } from '../services/api'
import {
Dialog,
DialogContent,
DialogDescription,
DialogFooter,
DialogHeader,
DialogTitle,
} from './ui/dialog'
import { Button } from './ui/button'
import { AlertCircle, CheckCircle2, Loader2 } from 'lucide-react'
interface CollectionVerifierProps {
tema: string | null
onVerified?: (exists: boolean) => void
}
export function CollectionVerifier({ tema, onVerified }: CollectionVerifierProps) {
const [isChecking, setIsChecking] = useState(false)
const [collectionExists, setCollectionExists] = useState<boolean | null>(null)
const [showCreateDialog, setShowCreateDialog] = useState(false)
const [isCreating, setIsCreating] = useState(false)
const [error, setError] = useState<string | null>(null)
useEffect(() => {
if (tema) {
checkCollection()
} else {
setCollectionExists(null)
}
}, [tema])
const checkCollection = async () => {
if (!tema) return
setIsChecking(true)
setError(null)
try {
const result = await api.checkCollectionExists(tema)
setCollectionExists(result.exists)
// If it does not exist, show the confirmation dialog
if (!result.exists) {
setShowCreateDialog(true)
}
onVerified?.(result.exists)
} catch (err) {
console.error('Error checking collection:', err)
setError(err instanceof Error ? err.message : 'Error al verificar colección')
setCollectionExists(null)
} finally {
setIsChecking(false)
}
}
const handleCreateCollection = async () => {
if (!tema) return
setIsCreating(true)
setError(null)
try {
const result = await api.createCollection(tema)
if (result.success) {
setCollectionExists(true)
setShowCreateDialog(false)
onVerified?.(true)
}
} catch (err) {
console.error('Error creating collection:', err)
setError(err instanceof Error ? err.message : 'Error al crear colección')
} finally {
setIsCreating(false)
}
}
const handleCancelCreate = () => {
setShowCreateDialog(false)
// Optionally, we could notify that the collection was not created
onVerified?.(false)
}
// Render nothing when no tema is selected
if (!tema) {
return null
}
return (
<>
{/* Collection status indicator */}
{isChecking ? (
<div className="flex items-center gap-2 text-sm text-gray-500 mb-4">
<Loader2 className="w-4 h-4 animate-spin" />
<span>Verificando colección...</span>
</div>
) : collectionExists === true ? (
<div className="flex items-center gap-2 text-sm text-green-600 mb-4">
<CheckCircle2 className="w-4 h-4" />
<span>Colección "{tema}" disponible en Qdrant</span>
</div>
) : collectionExists === false ? (
<div className="flex items-center gap-2 text-sm text-yellow-600 mb-4">
<AlertCircle className="w-4 h-4" />
<span>Colección "{tema}" no existe en Qdrant</span>
</div>
) : error ? (
<div className="flex items-center gap-2 text-sm text-red-600 mb-4">
<AlertCircle className="w-4 h-4" />
<span>{error}</span>
</div>
) : null}
{/* Confirmation dialog for creating the collection */}
<Dialog open={showCreateDialog} onOpenChange={setShowCreateDialog}>
<DialogContent>
<DialogHeader>
<DialogTitle>Crear colección en Qdrant</DialogTitle>
<DialogDescription>
La colección "<strong>{tema}</strong>" no existe en la base de datos vectorial.
<br />
<br />
¿Deseas crear esta colección ahora? Esto permitirá almacenar y buscar chunks de
documentos para este tema.
</DialogDescription>
</DialogHeader>
{error && (
<div className="flex items-center gap-2 text-sm text-red-600 bg-red-50 p-3 rounded">
<AlertCircle className="w-4 h-4" />
<span>{error}</span>
</div>
)}
<DialogFooter>
<Button
variant="outline"
onClick={handleCancelCreate}
disabled={isCreating}
>
Cancelar
</Button>
<Button
onClick={handleCreateCollection}
disabled={isCreating}
>
{isCreating ? (
<>
<Loader2 className="w-4 h-4 mr-2 animate-spin" />
Creando...
</>
) : (
'Crear colección'
)}
</Button>
</DialogFooter>
</DialogContent>
</Dialog>
</>
)
}
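As a usage sketch, the verifier is meant to sit under whatever control selects the tema; the parent component below is hypothetical and only illustrates the wiring:

// Hypothetical parent: re-checks the collection whenever the tema changes
function TemaSection({ selectedTema }: { selectedTema: string | null }) {
  return (
    <CollectionVerifier
      tema={selectedTema}
      onVerified={(exists) => console.log(`Collection ready: ${exists}`)}
    />
  )
}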


@@ -15,6 +15,10 @@ import { Checkbox } from '@/components/ui/checkbox'
import { FileUpload } from './FileUpload'
import { DeleteConfirmDialog } from './DeleteConfirmDialog'
import { PDFPreviewModal } from './PDFPreviewModal'
import { CollectionVerifier } from './CollectionVerifier'
import { ChunkViewerModal } from './ChunkViewerModal'
import { ChunkingConfigModal, type ChunkingConfig } from './ChunkingConfigModal'
import { ChunkPreviewPanel } from './ChunkPreviewPanel'
import {
Upload,
Download,
@@ -22,7 +26,8 @@ import {
Search,
FileText,
Eye,
MessageSquare,
Scissors
} from 'lucide-react'
export function Dashboard() {
@@ -52,6 +57,20 @@ export function Dashboard() {
const [previewFileTema, setPreviewFileTema] = useState<string | undefined>(undefined)
const [loadingPreview, setLoadingPreview] = useState(false)
// State for the chunk viewer modal
const [chunkViewerOpen, setChunkViewerOpen] = useState(false)
const [chunkFileName, setChunkFileName] = useState('')
const [chunkFileTema, setChunkFileTema] = useState('')
// State for chunking
const [chunkingConfigOpen, setChunkingConfigOpen] = useState(false)
const [chunkingFileName, setChunkingFileName] = useState('')
const [chunkingFileTema, setChunkingFileTema] = useState('')
const [chunkingCollectionName, setChunkingCollectionName] = useState('')
const [chunkPreviewOpen, setChunkPreviewOpen] = useState(false)
const [chunkingConfig, setChunkingConfig] = useState<ChunkingConfig | null>(null)
useEffect(() => {
loadFiles()
}, [selectedTema])
@@ -173,6 +192,54 @@ export function Dashboard() {
}
}
// Open the chunk viewer modal
const handleViewChunks = (filename: string, tema: string) => {
if (!tema) {
alert('No hay tema seleccionado. Por favor selecciona un tema primero.')
return
}
setChunkFileName(filename)
setChunkFileTema(tema)
setChunkViewerOpen(true)
}
// Chunking handlers
const handleStartChunking = (filename: string, tema: string) => {
if (!tema) {
alert('No hay tema seleccionado. Por favor selecciona un tema primero.')
return
}
setChunkingFileName(filename)
setChunkingFileTema(tema)
setChunkingCollectionName(tema) // Use the tema as the collection name
setChunkingConfigOpen(true)
}
const handlePreviewChunking = (config: ChunkingConfig) => {
setChunkingConfig(config)
setChunkingConfigOpen(false)
setChunkPreviewOpen(true)
}
const handleAcceptChunking = async (config: ChunkingConfig) => {
try {
const result = await api.processChunkingFull(config)
alert(`Procesamiento completado: ${result.chunks_added} chunks agregados a ${result.collection_name}`)
// Reload the file list to refresh state
loadFiles()
} catch (error) {
console.error('Error processing PDF:', error)
throw error
}
}
const handleCancelChunking = () => {
setChunkPreviewOpen(false)
setChunkingConfig(null)
// Optionally return to the configuration modal
// setChunkingConfigOpen(true)
}
const filteredFiles = files.filter(file =>
file.name.toLowerCase().includes(searchTerm.toLowerCase())
)
@@ -350,10 +417,19 @@ export function Dashboard() {
>
<Download className="w-4 h-4" />
</Button>
<Button
variant="ghost"
size="sm"
title="Procesar con chunking"
onClick={() => handleStartChunking(file.name, file.tema)}
>
<Scissors className="w-4 h-4" />
</Button>
<Button
variant="ghost"
size="sm"
title="Ver chunks"
onClick={() => handleViewChunks(file.name, file.tema)}
>
<Eye className="w-4 h-4" />
</Button>
@@ -406,6 +482,41 @@ export function Dashboard() {
fileName={previewFileName}
onDownload={handleDownloadFromPreview}
/>
{/* Collection verifier: checks/creates the collection when a tema is selected */}
<CollectionVerifier
tema={selectedTema}
onVerified={(exists) => {
console.log(`Collection ${selectedTema} exists: ${exists}`)
}}
/>
{/* Chunk Viewer Modal */}
<ChunkViewerModal
isOpen={chunkViewerOpen}
onClose={() => setChunkViewerOpen(false)}
fileName={chunkFileName}
tema={chunkFileTema}
/>
{/* Chunking configuration modal */}
<ChunkingConfigModal
isOpen={chunkingConfigOpen}
onClose={() => setChunkingConfigOpen(false)}
fileName={chunkingFileName}
tema={chunkingFileTema}
collectionName={chunkingCollectionName}
onPreview={handlePreviewChunking}
/>
{/* Chunk preview panel */}
<ChunkPreviewPanel
isOpen={chunkPreviewOpen}
onClose={() => setChunkPreviewOpen(false)}
config={chunkingConfig}
onAccept={handleAcceptChunking}
onCancel={handleCancelChunking}
/>
</div>
)
}


@@ -0,0 +1,159 @@
"use client"
import * as React from "react"
import * as SelectPrimitive from "@radix-ui/react-select"
import { Check, ChevronDown, ChevronUp } from "lucide-react"
import { cn } from "@/lib/utils"
const Select = SelectPrimitive.Root
const SelectGroup = SelectPrimitive.Group
const SelectValue = SelectPrimitive.Value
const SelectTrigger = React.forwardRef<
React.ElementRef<typeof SelectPrimitive.Trigger>,
React.ComponentPropsWithoutRef<typeof SelectPrimitive.Trigger>
>(({ className, children, ...props }, ref) => (
<SelectPrimitive.Trigger
ref={ref}
className={cn(
"flex h-9 w-full items-center justify-between whitespace-nowrap rounded-md border border-input bg-transparent px-3 py-2 text-sm shadow-sm ring-offset-background data-[placeholder]:text-muted-foreground focus:outline-none focus:ring-1 focus:ring-ring disabled:cursor-not-allowed disabled:opacity-50 [&>span]:line-clamp-1",
className
)}
{...props}
>
{children}
<SelectPrimitive.Icon asChild>
<ChevronDown className="h-4 w-4 opacity-50" />
</SelectPrimitive.Icon>
</SelectPrimitive.Trigger>
))
SelectTrigger.displayName = SelectPrimitive.Trigger.displayName
const SelectScrollUpButton = React.forwardRef<
React.ElementRef<typeof SelectPrimitive.ScrollUpButton>,
React.ComponentPropsWithoutRef<typeof SelectPrimitive.ScrollUpButton>
>(({ className, ...props }, ref) => (
<SelectPrimitive.ScrollUpButton
ref={ref}
className={cn(
"flex cursor-default items-center justify-center py-1",
className
)}
{...props}
>
<ChevronUp className="h-4 w-4" />
</SelectPrimitive.ScrollUpButton>
))
SelectScrollUpButton.displayName = SelectPrimitive.ScrollUpButton.displayName
const SelectScrollDownButton = React.forwardRef<
React.ElementRef<typeof SelectPrimitive.ScrollDownButton>,
React.ComponentPropsWithoutRef<typeof SelectPrimitive.ScrollDownButton>
>(({ className, ...props }, ref) => (
<SelectPrimitive.ScrollDownButton
ref={ref}
className={cn(
"flex cursor-default items-center justify-center py-1",
className
)}
{...props}
>
<ChevronDown className="h-4 w-4" />
</SelectPrimitive.ScrollDownButton>
))
SelectScrollDownButton.displayName =
SelectPrimitive.ScrollDownButton.displayName
const SelectContent = React.forwardRef<
React.ElementRef<typeof SelectPrimitive.Content>,
React.ComponentPropsWithoutRef<typeof SelectPrimitive.Content>
>(({ className, children, position = "popper", ...props }, ref) => (
<SelectPrimitive.Portal>
<SelectPrimitive.Content
ref={ref}
className={cn(
"relative z-50 max-h-[--radix-select-content-available-height] min-w-[8rem] overflow-y-auto overflow-x-hidden rounded-md border bg-popover text-popover-foreground shadow-md data-[state=open]:animate-in data-[state=closed]:animate-out data-[state=closed]:fade-out-0 data-[state=open]:fade-in-0 data-[state=closed]:zoom-out-95 data-[state=open]:zoom-in-95 data-[side=bottom]:slide-in-from-top-2 data-[side=left]:slide-in-from-right-2 data-[side=right]:slide-in-from-left-2 data-[side=top]:slide-in-from-bottom-2 origin-[--radix-select-content-transform-origin]",
position === "popper" &&
"data-[side=bottom]:translate-y-1 data-[side=left]:-translate-x-1 data-[side=right]:translate-x-1 data-[side=top]:-translate-y-1",
className
)}
position={position}
{...props}
>
<SelectScrollUpButton />
<SelectPrimitive.Viewport
className={cn(
"p-1",
position === "popper" &&
"h-[var(--radix-select-trigger-height)] w-full min-w-[var(--radix-select-trigger-width)]"
)}
>
{children}
</SelectPrimitive.Viewport>
<SelectScrollDownButton />
</SelectPrimitive.Content>
</SelectPrimitive.Portal>
))
SelectContent.displayName = SelectPrimitive.Content.displayName
const SelectLabel = React.forwardRef<
React.ElementRef<typeof SelectPrimitive.Label>,
React.ComponentPropsWithoutRef<typeof SelectPrimitive.Label>
>(({ className, ...props }, ref) => (
<SelectPrimitive.Label
ref={ref}
className={cn("px-2 py-1.5 text-sm font-semibold", className)}
{...props}
/>
))
SelectLabel.displayName = SelectPrimitive.Label.displayName
const SelectItem = React.forwardRef<
React.ElementRef<typeof SelectPrimitive.Item>,
React.ComponentPropsWithoutRef<typeof SelectPrimitive.Item>
>(({ className, children, ...props }, ref) => (
<SelectPrimitive.Item
ref={ref}
className={cn(
"relative flex w-full cursor-default select-none items-center rounded-sm py-1.5 pl-2 pr-8 text-sm outline-none focus:bg-accent focus:text-accent-foreground data-[disabled]:pointer-events-none data-[disabled]:opacity-50",
className
)}
{...props}
>
<span className="absolute right-2 flex h-3.5 w-3.5 items-center justify-center">
<SelectPrimitive.ItemIndicator>
<Check className="h-4 w-4" />
</SelectPrimitive.ItemIndicator>
</span>
<SelectPrimitive.ItemText>{children}</SelectPrimitive.ItemText>
</SelectPrimitive.Item>
))
SelectItem.displayName = SelectPrimitive.Item.displayName
const SelectSeparator = React.forwardRef<
React.ElementRef<typeof SelectPrimitive.Separator>,
React.ComponentPropsWithoutRef<typeof SelectPrimitive.Separator>
>(({ className, ...props }, ref) => (
<SelectPrimitive.Separator
ref={ref}
className={cn("-mx-1 my-1 h-px bg-muted", className)}
{...props}
/>
))
SelectSeparator.displayName = SelectPrimitive.Separator.displayName
export {
Select,
SelectGroup,
SelectValue,
SelectTrigger,
SelectContent,
SelectLabel,
SelectItem,
SelectSeparator,
SelectScrollUpButton,
SelectScrollDownButton,
}


@@ -0,0 +1,27 @@
import * as React from "react"
import * as SwitchPrimitives from "@radix-ui/react-switch"
import { cn } from "@/lib/utils"
const Switch = React.forwardRef<
React.ElementRef<typeof SwitchPrimitives.Root>,
React.ComponentPropsWithoutRef<typeof SwitchPrimitives.Root>
>(({ className, ...props }, ref) => (
<SwitchPrimitives.Root
className={cn(
"peer inline-flex h-5 w-9 shrink-0 cursor-pointer items-center rounded-full border-2 border-transparent shadow-sm transition-colors focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring focus-visible:ring-offset-2 focus-visible:ring-offset-background disabled:cursor-not-allowed disabled:opacity-50 data-[state=checked]:bg-primary data-[state=unchecked]:bg-input",
className
)}
{...props}
ref={ref}
>
<SwitchPrimitives.Thumb
className={cn(
"pointer-events-none block h-4 w-4 rounded-full bg-background shadow-lg ring-0 transition-transform data-[state=checked]:translate-x-4 data-[state=unchecked]:translate-x-0"
)}
/>
</SwitchPrimitives.Root>
))
Switch.displayName = SwitchPrimitives.Root.displayName
export { Switch }


@@ -0,0 +1,53 @@
import * as React from "react"
import * as TabsPrimitive from "@radix-ui/react-tabs"
import { cn } from "@/lib/utils"
const Tabs = TabsPrimitive.Root
const TabsList = React.forwardRef<
React.ElementRef<typeof TabsPrimitive.List>,
React.ComponentPropsWithoutRef<typeof TabsPrimitive.List>
>(({ className, ...props }, ref) => (
<TabsPrimitive.List
ref={ref}
className={cn(
"inline-flex h-9 items-center justify-center rounded-lg bg-muted p-1 text-muted-foreground",
className
)}
{...props}
/>
))
TabsList.displayName = TabsPrimitive.List.displayName
const TabsTrigger = React.forwardRef<
React.ElementRef<typeof TabsPrimitive.Trigger>,
React.ComponentPropsWithoutRef<typeof TabsPrimitive.Trigger>
>(({ className, ...props }, ref) => (
<TabsPrimitive.Trigger
ref={ref}
className={cn(
"inline-flex items-center justify-center whitespace-nowrap rounded-md px-3 py-1 text-sm font-medium ring-offset-background transition-all focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring focus-visible:ring-offset-2 disabled:pointer-events-none disabled:opacity-50 data-[state=active]:bg-background data-[state=active]:text-foreground data-[state=active]:shadow",
className
)}
{...props}
/>
))
TabsTrigger.displayName = TabsPrimitive.Trigger.displayName
const TabsContent = React.forwardRef<
React.ElementRef<typeof TabsPrimitive.Content>,
React.ComponentPropsWithoutRef<typeof TabsPrimitive.Content>
>(({ className, ...props }, ref) => (
<TabsPrimitive.Content
ref={ref}
className={cn(
"mt-2 ring-offset-background focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-ring focus-visible:ring-offset-2",
className
)}
{...props}
/>
))
TabsContent.displayName = TabsPrimitive.Content.displayName
export { Tabs, TabsList, TabsTrigger, TabsContent }


@@ -0,0 +1,22 @@
import * as React from "react"
import { cn } from "@/lib/utils"
const Textarea = React.forwardRef<
HTMLTextAreaElement,
React.ComponentProps<"textarea">
>(({ className, ...props }, ref) => {
return (
<textarea
className={cn(
"flex min-h-[60px] w-full rounded-md border border-input bg-transparent px-3 py-2 text-base shadow-sm placeholder:text-muted-foreground focus-visible:outline-none focus-visible:ring-1 focus-visible:ring-ring disabled:cursor-not-allowed disabled:opacity-50 md:text-sm",
className
)}
ref={ref}
{...props}
/>
)
})
Textarea.displayName = "Textarea"
export { Textarea }


@@ -188,4 +188,236 @@ export const api = {
return data.url
},
// ============================================================================
// Vector Database / Qdrant Operations
// ============================================================================
// Health check for the vector database
vectorHealthCheck: async (): Promise<{ status: string; db_type: string; message: string }> => {
const response = await fetch(`${API_BASE_URL}/vectors/health`)
if (!response.ok) throw new Error('Error checking vector DB health')
return response.json()
},
// Check whether a collection exists
checkCollectionExists: async (collectionName: string): Promise<{ exists: boolean; collection_name: string }> => {
const response = await fetch(`${API_BASE_URL}/vectors/collections/exists`, {
method: 'POST',
headers: {
'Content-Type': 'application/json',
},
body: JSON.stringify({ collection_name: collectionName }),
})
if (!response.ok) throw new Error('Error checking collection')
return response.json()
},
// Create a new collection
createCollection: async (
collectionName: string,
vectorSize: number = 3072,
distance: string = 'Cosine'
): Promise<{ success: boolean; collection_name: string; message: string }> => {
const response = await fetch(`${API_BASE_URL}/vectors/collections/create`, {
method: 'POST',
headers: {
'Content-Type': 'application/json',
},
body: JSON.stringify({
collection_name: collectionName,
vector_size: vectorSize,
distance: distance,
}),
})
if (!response.ok) {
const error = await response.json()
throw new Error(error.detail || 'Error creating collection')
}
return response.json()
},
// Delete a collection
deleteCollection: async (collectionName: string): Promise<{ success: boolean; collection_name: string; message: string }> => {
const response = await fetch(`${API_BASE_URL}/vectors/collections/${encodeURIComponent(collectionName)}`, {
method: 'DELETE',
})
if (!response.ok) throw new Error('Error deleting collection')
return response.json()
},
// Get information about a collection
getCollectionInfo: async (collectionName: string): Promise<{
name: string
vectors_count: number
vectors_config: { size: number; distance: string }
status: string
}> => {
const response = await fetch(`${API_BASE_URL}/vectors/collections/${encodeURIComponent(collectionName)}/info`)
if (!response.ok) throw new Error('Error getting collection info')
return response.json()
},
// Check whether a file exists in a collection
checkFileExistsInCollection: async (
collectionName: string,
fileName: string
): Promise<{ exists: boolean; collection_name: string; file_name: string; chunk_count?: number }> => {
const response = await fetch(`${API_BASE_URL}/vectors/files/exists`, {
method: 'POST',
headers: {
'Content-Type': 'application/json',
},
body: JSON.stringify({
collection_name: collectionName,
file_name: fileName,
}),
})
if (!response.ok) throw new Error('Error checking file in collection')
return response.json()
},
// Get the chunks of a file
getChunksByFile: async (
collectionName: string,
fileName: string,
limit?: number
): Promise<{
collection_name: string
file_name: string
chunks: Array<{ id: string; payload: any; vector?: number[] }>
total_chunks: number
}> => {
const url = limit
? `${API_BASE_URL}/vectors/collections/${encodeURIComponent(collectionName)}/files/${encodeURIComponent(fileName)}/chunks?limit=${limit}`
: `${API_BASE_URL}/vectors/collections/${encodeURIComponent(collectionName)}/files/${encodeURIComponent(fileName)}/chunks`
const response = await fetch(url)
if (!response.ok) throw new Error('Error getting chunks')
return response.json()
},
// Delete a file from a collection
deleteFileFromCollection: async (
collectionName: string,
fileName: string
): Promise<{ success: boolean; collection_name: string; file_name: string; chunks_deleted: number; message: string }> => {
const response = await fetch(
`${API_BASE_URL}/vectors/collections/${encodeURIComponent(collectionName)}/files/${encodeURIComponent(fileName)}`,
{ method: 'DELETE' }
)
if (!response.ok) throw new Error('Error deleting file from collection')
return response.json()
},
// Add chunks to a collection
addChunks: async (
collectionName: string,
chunks: Array<{ id: string; vector: number[]; payload: any }>
): Promise<{ success: boolean; collection_name: string; chunks_added: number; message: string }> => {
const response = await fetch(`${API_BASE_URL}/vectors/chunks/add`, {
method: 'POST',
headers: {
'Content-Type': 'application/json',
},
body: JSON.stringify({
collection_name: collectionName,
chunks: chunks,
}),
})
if (!response.ok) throw new Error('Error adding chunks')
return response.json()
},
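// For reference, a hypothetical chunk as expected by addChunks above; the
// payload mirrors the shape read back by getChunksByFile:
//   {
//     id: 'a-uuid-string',
//     vector: [0.012, -0.034 /* one float per embedding dimension */],
//     payload: { page_content: '...', metadata: { file_name: 'doc.pdf', page: 1 } },
//   }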
// ============================================================================
// Chunking Operations
// ============================================================================
// Get the predefined chunking profiles
getChunkingProfiles: async (): Promise<{
profiles: Array<{
id: string
name: string
description: string
max_tokens: number
target_tokens: number
chunk_size: number
chunk_overlap: number
use_llm: boolean
}>
}> => {
const response = await fetch(`${API_BASE_URL}/chunking/profiles`)
if (!response.ok) throw new Error('Error fetching chunking profiles')
return response.json()
},
// Generate a chunk preview (up to 3 chunks)
generateChunkPreview: async (config: {
file_name: string
tema: string
max_tokens?: number
target_tokens?: number
chunk_size?: number
chunk_overlap?: number
use_llm?: boolean
custom_instructions?: string
}): Promise<{
success: boolean
file_name: string
tema: string
chunks: Array<{
index: number
text: string
page: number
file_name: string
tokens: number
}>
message: string
}> => {
const response = await fetch(`${API_BASE_URL}/chunking/preview`, {
method: 'POST',
headers: {
'Content-Type': 'application/json',
},
body: JSON.stringify(config),
})
if (!response.ok) {
const error = await response.json()
throw new Error(error.detail || 'Error generating preview')
}
return response.json()
},
// Process the full PDF
processChunkingFull: async (config: {
file_name: string
tema: string
collection_name: string
max_tokens?: number
target_tokens?: number
chunk_size?: number
chunk_overlap?: number
use_llm?: boolean
custom_instructions?: string
}): Promise<{
success: boolean
collection_name: string
file_name: string
total_chunks: number
chunks_added: number
message: string
}> => {
const response = await fetch(`${API_BASE_URL}/chunking/process`, {
method: 'POST',
headers: {
'Content-Type': 'application/json',
},
body: JSON.stringify(config),
})
if (!response.ok) {
const error = await response.json()
throw new Error(error.detail || 'Error processing PDF')
}
return response.json()
},
}
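Taken together, a minimal end-to-end sketch of the chunking flow with this client might look like the following; chunkAndIndex is a hypothetical helper and assumes the file already exists in storage under the given tema:

async function chunkAndIndex(fileName: string, tema: string) {
  // Make sure the target Qdrant collection exists before indexing
  const { exists } = await api.checkCollectionExists(tema)
  if (!exists) {
    await api.createCollection(tema) // defaults: 3072-dim vectors, Cosine distance
  }
  // Inspect a few chunks before committing to a full run
  const preview = await api.generateChunkPreview({ file_name: fileName, tema })
  console.log(`Preview returned ${preview.chunks.length} chunks`)
  // Chunk, embed, and store the whole PDF
  const result = await api.processChunkingFull({
    file_name: fileName,
    tema,
    collection_name: tema,
  })
  console.log(result.message)
}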