Initial Python rewrite

2026-02-19 17:50:14 +00:00
parent da95a64fb7
commit faa04a0d01
158 changed files with 5122 additions and 1144 deletions
--- a/src/capa_de_integracion/services/rag_service.py
+++ b/src/capa_de_integracion/services/rag_service.py
@@ -0,0 +1,139 @@
+import logging
+
+import httpx
+from pydantic import BaseModel, Field
+
+from capa_de_integracion.config import Settings
+
+logger = logging.getLogger(__name__)
+
+
+class Message(BaseModel):
+    """OpenAI-style message format."""
+
+    role: str = Field(..., description="Role: system, user, or assistant")
+    content: str = Field(..., description="Message content")
+
+
+class RAGRequest(BaseModel):
+    """Request model for RAG endpoint."""
+
+    messages: list[Message] = Field(..., description="Conversation history")
+
+
+class RAGResponse(BaseModel):
+    """Response model from RAG endpoint."""
+
+    response: str = Field(..., description="Generated response from RAG")
+
+
+class RAGService:
+    """Highly concurrent HTTP client for calling RAG endpoints.
+
+    Uses httpx AsyncClient with connection pooling for optimal performance
+    when handling multiple concurrent requests.
+    """
+
+    def __init__(
+        self,
+        settings: Settings,
+        max_connections: int = 100,
+        max_keepalive_connections: int = 20,
+        timeout: float = 30.0,
+    ) -> None:
+        """Initialize RAG service with connection pooling.
+
+        Args:
+            settings: Application settings
+            max_connections: Maximum number of concurrent connections
+            max_keepalive_connections: Maximum number of idle connections to keep alive
+            timeout: Request timeout in seconds
+
+        """
+        self.settings = settings
+        self.rag_endpoint_url = settings.rag_endpoint_url
+        self.timeout = timeout
+
+        # Configure connection limits for high concurrency
+        limits = httpx.Limits(
+            max_connections=max_connections,
+            max_keepalive_connections=max_keepalive_connections,
+        )
+
+        # Create async client with connection pooling
+        self._client = httpx.AsyncClient(
+            limits=limits,
+            timeout=httpx.Timeout(timeout),
+            http2=True,  # Enable HTTP/2 for better performance
+        )
+
+        logger.info(
+            f"RAGService initialized with endpoint: {self.rag_endpoint_url}, "
+            f"max_connections: {max_connections}, timeout: {timeout}s",
+        )
+
+    async def query(self, messages: list[dict[str, str]]) -> str:
+        """Send conversation history to RAG endpoint and get response.
+
+        Args:
+            messages: OpenAI-style conversation history
+                     e.g., [{"role": "user", "content": "Hello"}, ...]
+
+        Returns:
+            Response string from RAG endpoint
+
+        Raises:
+            httpx.HTTPError: If HTTP request fails
+            ValueError: If response format is invalid
+
+        """
+        try:
+            # Validate and construct request
+            message_objects = [Message(**msg) for msg in messages]
+            request = RAGRequest(messages=message_objects)
+
+            # Make async HTTP POST request
+            logger.debug(f"Sending RAG request with {len(messages)} messages")
+
+            response = await self._client.post(
+                self.rag_endpoint_url,
+                json=request.model_dump(),
+                headers={"Content-Type": "application/json"},
+            )
+
+            # Raise exception for HTTP errors
+            response.raise_for_status()
+
+            # Parse response
+            response_data = response.json()
+            rag_response = RAGResponse(**response_data)
+
+            logger.debug(f"RAG response received: {len(rag_response.response)} chars")
+            return rag_response.response
+
+        except httpx.HTTPStatusError as e:
+            logger.exception(
+                f"HTTP error calling RAG endpoint: {e.response.status_code} - {e.response.text}",
+            )
+            raise
+        except httpx.RequestError as e:
+            logger.exception(f"Request error calling RAG endpoint: {e!s}")
+            raise
+        except Exception as e:
+            logger.error(
+                f"Unexpected error calling RAG endpoint: {e!s}", exc_info=True,
+            )
+            raise
+
+    async def close(self) -> None:
+        """Close the HTTP client and release connections."""
+        await self._client.aclose()
+        logger.info("RAGService client closed")
+
+    async def __aenter__(self):
+        """Async context manager entry."""
+        return self
+
+    async def __aexit__(self, exc_type, exc_val, exc_tb):
+        """Async context manager exit."""
+        await self.close()