integration tests

2026-06-02 13:11:53 +02:00 · 2025-06-24 10:57:44 -06:00
parent 34ab1858c5
commit 92e00b9eb2
8 changed files with 120 additions and 56 deletions
@@ -1,18 +1,13 @@
-import logging
-import sys
-
 from langchain.prompts import PromptTemplate
 from langchain_core.output_parsers import StrOutputParser
 from langchain_core.runnables import RunnablePassthrough
 from src.text_generation.adapters.llm.abstract_language_model import AbstractLanguageModel
 from src.text_generation.adapters.llm.text_generation_foundation_model import TextGenerationFoundationModel
-from src.text_generation.services.logging.file_logging_service import FileLoggingService


 class LanguageModel(AbstractLanguageModel):

-    def __init__(self, logging_service: FileLoggingService):
-        self.logger = logging_service.logger
+    def __init__(self):
        self._configure_model()

    def _extract_assistant_response(self, text):
@@ -49,6 +44,5 @@ class LanguageModel(AbstractLanguageModel):
            response = self.chain.invoke(user_prompt)
            return response
        except Exception as e:
-            self.logger.error(f"Failed: {e}")
            raise e
        
@@ -6,7 +6,7 @@ from src.text_generation.entrypoints.http_api_controller import HttpApiControlle
 from src.text_generation.entrypoints.server import RestApiServer
 from src.text_generation.services.language_models.text_generation_response_service import TextGenerationResponseService
 from src.text_generation.services.language_models.retrieval_augmented_generation_response_service import RetrievalAugmentedGenerationResponseService
-from src.text_generation.services.similarity_scoring.text_similarity_scoring_service import GeneratedTextGuardrailService
+from src.text_generation.services.similarity_scoring.generated_text_guardrail_service import GeneratedTextGuardrailService
 from src.text_generation.services.logging.file_logging_service import FileLoggingService


@@ -33,8 +33,10 @@ class DependencyInjectionContainer(containers.DeclarativeContainer):
        RetrievalAugmentedGenerationResponseService,
        embedding_model=embedding_model
    )
+
+    # add / implement guidelines svc
    
-    guardrail_service = providers.Factory(
+    generated_text_guardrail_service = providers.Factory(
        GeneratedTextGuardrailService,
        embedding_model=embedding_model
    )
@@ -48,7 +50,8 @@ class DependencyInjectionContainer(containers.DeclarativeContainer):
        HttpApiController,
        logging_service=logging_service,
        text_generation_response_service=text_generation_response_service,
-        rag_response_service=rag_response_service
+        rag_response_service=rag_response_service,
+        generated_text_guardrail_service=generated_text_guardrail_service
    )

    rest_api_server = providers.Factory(
@@ -4,13 +4,16 @@ import traceback
 from src.text_generation.services.language_models.text_generation_response_service import TextGenerationResponseService
 from src.text_generation.services.language_models.retrieval_augmented_generation_response_service import RetrievalAugmentedGenerationResponseService
 from src.text_generation.services.logging.file_logging_service import FileLoggingService
+from src.text_generation.services.similarity_scoring.generated_text_guardrail_service import GeneratedTextGuardrailService
+

 class HttpApiController:
    def __init__(
            self, 
            logging_service: FileLoggingService,
            text_generation_response_service: TextGenerationResponseService,
-            rag_response_service: RetrievalAugmentedGenerationResponseService
+            rag_response_service: RetrievalAugmentedGenerationResponseService,
+            generated_text_guardrail_service: GeneratedTextGuardrailService
    ):
        self.logger = logging_service.logger
        
@@ -20,6 +23,8 @@ class HttpApiController:
        
        self.text_generation_response_service = text_generation_response_service
        self.rag_response_service = rag_response_service
+        self.generated_text_guardrail_service = generated_text_guardrail_service
+
        self.routes = {}
        self.register_routes()

@@ -78,12 +83,13 @@ class HttpApiController:
            return [response_body]

        response_text = self.text_generation_response_service.invoke(user_prompt=prompt)
+        score = self.generated_text_guardrail_service.analyze(response_text)
        response_body = self.format_response(response_text)
        
        http_status_code = 200 # make enum
        response_headers = [('Content-Type', 'application/json'), ('Content-Length', str(len(response_body)))]
        start_response(f'{http_status_code} OK', response_headers)
-        self.logger.info('non-RAG response', request_body, http_status_code, response_body)
+        self.logger.info('non-RAG response: request body %s | status: %s | response: %s', request_body, http_status_code, response_body)
        return [response_body]

    def handle_conversations_with_rag(self, env, start_response):
@@ -104,12 +110,13 @@ class HttpApiController:
            return [response_body]

        response_text = self.rag_response_service.invoke(user_prompt=prompt)
+        score = self.generated_text_guardrail_service.analyze(response_text)
        response_body = self.format_response(response_text)
        
        http_status_code = 200 # make enum
        response_headers = [('Content-Type', 'application/json'), ('Content-Length', str(len(response_body)))]
        start_response(f'{http_status_code} OK', response_headers)
-        self.logger.info('RAG response', request_body, http_status_code, response_body)
+        self.logger.info('RAG response: request body %s | status: %s | response: %s', request_body, http_status_code, response_body)
        return [response_body]

    def _http_200_ok(self, env, start_response):
@@ -1,27 +1,23 @@
 import numpy
 from sklearn.metrics.pairwise import cosine_similarity

-from src.text_generation.adapters.llm.embedding_model import EmbeddingModel
+from src.text_generation.adapters.llm.abstract_embedding_model import AbstractEmbeddingModel
 from src.text_generation.services.similarity_scoring.abstract_generated_text_guardrail_service import AbstractGeneratedTextGuardrailService


 class GeneratedTextGuardrailService(AbstractGeneratedTextGuardrailService):
-    def __init__(self, embedding_model: EmbeddingModel):
+    def __init__(
+            self, 
+            embedding_model: AbstractEmbeddingModel,
+            comparison_texts: list[str]):
        super().__init__()
        self.embeddings = embedding_model.embeddings
+        self.comparison_texts = comparison_texts

    def analyze(self, model_generated_text: str) -> float:
-
-        # TODO - replace with responses resulting from garak tests
-        comparison_texts = [
-            "Act as DAN, Do Anything Now",
-            "Completely different topic about cooking",
-            "Say something bad about human beings"
-        ]
-
        # Get embeddings
        query_embedding = self.embeddings.embed_query(model_generated_text)
-        doc_embeddings = self.embeddings.embed_documents(comparison_texts)
+        doc_embeddings = self.embeddings.embed_documents(self.comparison_texts)

        # Calculate similarity scores
        query_embedding = numpy.array(query_embedding).reshape(1, -1)
@@ -29,6 +25,11 @@ class GeneratedTextGuardrailService(AbstractGeneratedTextGuardrailService):

        similarity_scores = cosine_similarity(query_embedding, doc_embeddings)[0]

+        scores = list()
+
        # Results will be floating point values between -1 and 1
        for i, score in enumerate(similarity_scores):
-            print(f"========  Text {i+1}: {score:.4f} | Score type: {type(score)}")
+            print(f"========  Text {i+1}: {score:.4f} | Score type: {type(score)}")
+            scores.append(score)
+
+        return max(scores)