Bakalarska_praca/Backend/model.py


import json
import requests
import logging
import time
import re
from requests.exceptions import HTTPError
from elasticsearch import Elasticsearch
from langchain.chains import LLMChain, SequentialChain
from langchain_huggingface import HuggingFaceEmbeddings
from langchain_elasticsearch import ElasticsearchStore
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain.docstore.document import Document
from googletrans import Translator # Translator for final polishing
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
# Load configuration
config_file_path = "config.json"
with open(config_file_path, 'r') as config_file:
    config = json.load(config_file)
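
# Expected shape of config.json (sketch; "useCloud" is read below, while
# "mistral_api_key" is an assumed key for the API credential loaded next):
# {
#     "useCloud": false,
#     "mistral_api_key": "<your-mistral-api-key>"
# }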
# Load Mistral API key from the configuration file instead of hardcoding it.
# NOTE: assumes config.json provides a "mistral_api_key" entry (see sketch above).
mistral_api_key = config.get("mistral_api_key")
if not mistral_api_key:
    raise ValueError("Mistral API key not found in configuration.")

###############################################################################
# Function to translate entire text to Slovak #
###############################################################################
translator = Translator()
def translate_to_slovak(text: str) -> str:
    """
    Translates the entire text into Slovak.
    Logs the text before and after translation.
    """
    if not text.strip():
        return text
    try:
        logger.info(f"Text before translation: {text}")
        # 1) Slovak (or any language) -> English
        mid_result = translator.translate(text, src='auto', dest='en').text
        # 2) English -> Slovak
        final_result = translator.translate(mid_result, src='en', dest='sk').text
        logger.info(f"Text after translation: {final_result}")
        return final_result
    except Exception as e:
        logger.error(f"Translation error: {e}")
        return text  # fallback to the original text
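
# Example round-trip (hypothetical input and output), assuming the synchronous
# googletrans API and network access:
#   translate_to_slovak("Paracetamol relieves pain and fever.")
#   -> e.g. "Paracetamol zmierňuje bolesť a horúčku."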
###############################################################################
# Custom Mistral LLM #
###############################################################################
class CustomMistralLLM:
    def __init__(self, api_key: str, endpoint_url: str, model_name: str):
        self.api_key = api_key
        self.endpoint_url = endpoint_url
        self.model_name = model_name

    def generate_text(self, prompt: str, max_tokens=512, temperature=0.7, retries=3, delay=2):
        headers = {
            "Authorization": f"Bearer {self.api_key}",
            "Content-Type": "application/json"
        }
        payload = {
            "model": self.model_name,
            "messages": [{"role": "user", "content": prompt}],
            "max_tokens": max_tokens,
            "temperature": temperature
        }
        attempt = 0
        while attempt < retries:
            try:
                response = requests.post(self.endpoint_url, headers=headers, json=payload)
                response.raise_for_status()
                result = response.json()
                logger.info(f"Full response from model {self.model_name}: {result}")
                return result.get("choices", [{}])[0].get("message", {}).get("content", "No response")
            except HTTPError as e:
                if response.status_code == 429:  # Too Many Requests
                    logger.warning(f"Rate limit exceeded. Waiting {delay} seconds before retry.")
                    time.sleep(delay)
                    attempt += 1
                else:
                    logger.error(f"HTTP Error: {e}")
                    raise e
            except Exception as e:
                logger.error(f"Error: {str(e)}")
                raise e
        raise Exception("Reached maximum number of retries for API request")
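
# Usage sketch (mirrors the instances created below; the prompt is a
# hypothetical example):
#   llm = CustomMistralLLM(api_key=mistral_api_key,
#                          endpoint_url="https://api.mistral.ai/v1/chat/completions",
#                          model_name="mistral-small-latest")
#   reply = llm.generate_text("Stručne vysvetli, na čo sa používa ibuprofén.")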
###############################################################################
# Initialize embeddings and Elasticsearch store #
###############################################################################
logger.info("Loading HuggingFaceEmbeddings model...")
embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2")
index_name = 'drug_docs'
# Connect to Elasticsearch
if config.get("useCloud", False):
    logger.info("Using cloud Elasticsearch.")
    cloud_id = "tt:dXMtZWFzdC0yLmF3cy5lbGFzdGljLWNsb3VkLmNvbTo0NDMkOGM3ODQ0ZWVhZTEyNGY3NmFjNjQyNDFhNjI4NmVhYzMkZTI3YjlkNTQ0ODdhNGViNmEyMTcxMjMxNmJhMWI0ZGU="
    vectorstore = ElasticsearchStore(
        es_cloud_id=cloud_id,
        index_name=index_name,
        embedding=embeddings,
        es_user="elastic",
        es_password="sSz2BEGv56JRNjGFwoQ191RJ"
    )
else:
    logger.info("Using local Elasticsearch.")
    vectorstore = ElasticsearchStore(
        es_url="http://localhost:9200",
        index_name=index_name,
        embedding=embeddings,
    )

logger.info(f"Connected to {'cloud' if config.get('useCloud', False) else 'local'} Elasticsearch.")
###############################################################################
# Initialize Mistral models (small & large) #
###############################################################################
llm_small = CustomMistralLLM(
    api_key=mistral_api_key,
    endpoint_url="https://api.mistral.ai/v1/chat/completions",
    model_name="mistral-small-latest"
)
llm_large = CustomMistralLLM(
    api_key=mistral_api_key,
    endpoint_url="https://api.mistral.ai/v1/chat/completions",
    model_name="mistral-large-latest"
)
###############################################################################
# Helper function to evaluate model output #
###############################################################################
def evaluate_results(query, summaries, model_name):
    """
    Evaluates results by:
    - text length,
    - presence of query keywords, etc.
    Returns a rating and explanation.
    """
    query_keywords = query.split()
    total_score = 0
    explanation = []
    for i, summary in enumerate(summaries):
        # Length-based scoring: 1 point per 100 characters, capped at 10
        length_score = min(len(summary) / 100, 10)
        total_score += length_score
        explanation.append(f"Document {i+1}: Length score - {length_score}")

        # Keyword-based scoring: 2 points per matched query keyword, capped at 10
        keyword_matches = sum(1 for word in query_keywords if word.lower() in summary.lower())
        keyword_score = min(keyword_matches * 2, 10)
        total_score += keyword_score
        explanation.append(f"Document {i+1}: Keyword match score - {keyword_score}")

    final_score = total_score / len(summaries) if summaries else 0
    explanation_summary = "\n".join(explanation)
    logger.info(f"Evaluation for model {model_name}: {final_score}/10")
    logger.info(f"Explanation:\n{explanation_summary}")
    return {"rating": round(final_score, 2), "explanation": explanation_summary}
###############################################################################
# Main function: process_query_with_mistral (Slovak prompt) #
###############################################################################
def process_query_with_mistral(query, k=10):
    logger.info("Processing query started.")
    try:
        # --- Vector search ---
        vector_results = vectorstore.similarity_search(query, k=k)
        vector_documents = [hit.metadata.get('text', '') for hit in vector_results]

        # Keep only the first few documents, truncated, to stay within prompt limits
        max_docs = 5
        max_doc_length = 1000
        vector_documents = [doc[:max_doc_length] for doc in vector_documents[:max_docs]]

        if vector_documents:
            # Slovak prompt: asks for the three most suitable medicines or solutions,
            # each with a name and a brief explanation, in a numbered list, in Slovak.
            # The documents are joined with blank lines rather than interpolating the
            # raw Python list, which would leak brackets and quotes into the prompt.
            docs_joined = "\n\n".join(vector_documents)
            vector_prompt = (
                f"Otázka: '{query}'.\n"
                "Na základe nasledujúcich informácií o liekoch:\n"
                f"{docs_joined}\n\n"
                "Prosím, uveďte tri najvhodnejšie lieky alebo riešenia. Pre každý liek uveďte jeho názov a stručné, jasné vysvetlenie, prečo je vhodný. "
                "Odpovedajte priamo a ľudským, priateľským tónom v číslovanom zozname, bez nepotrebných úvodných fráz alebo opisu procesu. "
                "Odpoveď musí byť v slovenčine."
            )
            summary_small_vector = llm_small.generate_text(prompt=vector_prompt, max_tokens=700, temperature=0.7)
            summary_large_vector = llm_large.generate_text(prompt=vector_prompt, max_tokens=700, temperature=0.7)

            splitter = RecursiveCharacterTextSplitter(chunk_size=200, chunk_overlap=20)
            split_summary_small_vector = splitter.split_text(summary_small_vector)
            split_summary_large_vector = splitter.split_text(summary_large_vector)

            small_vector_eval = evaluate_results(query, split_summary_small_vector, 'Mistral Small')
            large_vector_eval = evaluate_results(query, split_summary_large_vector, 'Mistral Large')
        else:
            small_vector_eval = {"rating": 0, "explanation": "No results"}
            large_vector_eval = {"rating": 0, "explanation": "No results"}
            summary_small_vector = ""
            summary_large_vector = ""

        # --- Full-text search ---
        es_results = vectorstore.client.search(
            index=index_name,
            body={"size": k, "query": {"match": {"text": query}}}
        )
        text_documents = [hit['_source'].get('text', '') for hit in es_results['hits']['hits']]
        text_documents = [doc[:max_doc_length] for doc in text_documents[:max_docs]]

        if text_documents:
            # Same Slovak prompt, built from the full-text search hits
            docs_joined = "\n\n".join(text_documents)
            text_prompt = (
                f"Otázka: '{query}'.\n"
                "Na základe nasledujúcich informácií o liekoch:\n"
                f"{docs_joined}\n\n"
                "Prosím, uveďte tri najvhodnejšie lieky alebo riešenia. Pre každý liek uveďte jeho názov a stručné, jasné vysvetlenie, prečo je vhodný. "
                "Odpovedajte priamo a ľudským, priateľským tónom v číslovanom zozname, bez nepotrebných úvodných fráz alebo opisu procesu. "
                "Odpoveď musí byť v slovenčine."
            )
            summary_small_text = llm_small.generate_text(prompt=text_prompt, max_tokens=700, temperature=0.7)
            summary_large_text = llm_large.generate_text(prompt=text_prompt, max_tokens=700, temperature=0.7)

            splitter = RecursiveCharacterTextSplitter(chunk_size=200, chunk_overlap=20)
            split_summary_small_text = splitter.split_text(summary_small_text)
            split_summary_large_text = splitter.split_text(summary_large_text)

            small_text_eval = evaluate_results(query, split_summary_small_text, 'Mistral Small')
            large_text_eval = evaluate_results(query, split_summary_large_text, 'Mistral Large')
        else:
            small_text_eval = {"rating": 0, "explanation": "No results"}
            large_text_eval = {"rating": 0, "explanation": "No results"}
            summary_small_text = ""
            summary_large_text = ""

        # Combine all results and pick the best
        all_results = [
            {"eval": small_vector_eval, "summary": summary_small_vector, "model": "Mistral Small Vector"},
            {"eval": large_vector_eval, "summary": summary_large_vector, "model": "Mistral Large Vector"},
            {"eval": small_text_eval, "summary": summary_small_text, "model": "Mistral Small Text"},
            {"eval": large_text_eval, "summary": summary_large_text, "model": "Mistral Large Text"},
        ]
        best_result = max(all_results, key=lambda x: x["eval"]["rating"])
        logger.info(f"Best result from model {best_result['model']} with score {best_result['eval']['rating']}.")

        # Final translation pass to Slovak (logs the text before and after)
        polished_answer = translate_to_slovak(best_result["summary"])
        return {
            "best_answer": polished_answer,
            "model": best_result["model"],
            "rating": best_result["eval"]["rating"],
            "explanation": best_result["eval"]["explanation"]
        }
    except Exception as e:
        logger.error(f"Error: {str(e)}")
        return {
            "best_answer": "An error occurred during query processing.",
            "error": str(e)
        }
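
###############################################################################
# Example usage (sketch)                                                      #
###############################################################################
# Minimal smoke test, assuming a populated 'drug_docs' index and valid Mistral
# credentials; the query below is a hypothetical example.
if __name__ == "__main__":
    result = process_query_with_mistral("Aké lieky pomáhajú pri bolesti hlavy?")
    print(result["best_answer"])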