TEST-GIZ-Project-Search

Running on CPU Upgrade

App Files Files Community

annikwag commited on Mar 11

Commit

aebc985

verified ·

1 Parent(s): e25a980

Create rag_utils.py

Browse files

Files changed (1) hide show

appStore/rag_utils.py +126 -0

appStore/rag_utils.py ADDED Viewed

	@@ -0,0 +1,126 @@

+import re
+import requests
+import streamlit as st
+def truncate_to_tokens(text, max_tokens):
+    """
+    Truncate a text to an approximate token count by splitting on whitespace.
+    Args:
+        text (str): The text to truncate.
+        max_tokens (int): Maximum number of tokens/words to keep.
+    Returns:
+        str: The truncated text.
+    """
+    tokens = text.split()
+    if len(tokens) > max_tokens:
+        return " ".join(tokens[:max_tokens])
+    return text
+def build_context_for_result(res, compute_title_fn):
+    """
+    Build a context string (title + objective + description) from a search result.
+    Args:
+        res (dict): A result dictionary with 'payload' key containing metadata.
+        compute_title_fn (callable): Function to compute the title from metadata.
+    Returns:
+        str: Combined text from title, objective, and description.
+    """
+    metadata = res.payload.get('metadata', {})
+    title = metadata.get("title", compute_title_fn(metadata))
+    objective = metadata.get("objective", "")
+    desc_en = metadata.get("description.en", "").strip()
+    desc_de = metadata.get("description.de", "").strip()
+    description = desc_en if desc_en else desc_de
+    return f"{title}\n{objective}\n{description}"
+def highlight_query(text, query):
+    """
+    Highlight the query text in the given string with red/bold HTML styling.
+    Args:
+        text (str): The full text in which to highlight matches.
+        query (str): The substring (query) to highlight.
+    Returns:
+        str: The HTML-formatted string with highlighted matches.
+    """
+    pattern = re.compile(re.escape(query), re.IGNORECASE)
+    return pattern.sub(lambda m: f"<span style='color:red; font-weight:bold;'>{m.group(0)}</span>", text)
+def format_project_id(pid):
+    """
+    Format a numeric project ID into the typical GIZ format (e.g. '201940485' -> '2019.4048.5').
+    Args:
+        pid (str|int): The project ID to format.
+    Returns:
+        str: Formatted project ID if it has enough digits, otherwise the original string.
+    """
+    s = str(pid)
+    if len(s) > 5:
+        return s[:4] + "." + s[4:-1] + "." + s[-1]
+    return s
+def compute_title(metadata):
+    """
+    Compute a default title from metadata using name.en (or name.de if empty).
+    If an ID is present, append it in brackets.
+    Args:
+        metadata (dict): Project metadata dictionary.
+    Returns:
+        str: Computed title string or 'No Title'.
+    """
+    name_en = metadata.get("name.en", "").strip()
+    name_de = metadata.get("name.de", "").strip()
+    base = name_en if name_en else name_de
+    pid = metadata.get("id", "")
+    if base and pid:
+        return f"{base} [{format_project_id(pid)}]"
+    return base or "No Title"
+def get_rag_answer(query, top_results, endpoint, token):
+    """
+    Send a prompt to the LLM endpoint, including the context from top results.
+    Args:
+        query (str): The user question.
+        top_results (list): List of top search results from which to build context.
+        endpoint (str): The HuggingFace Inference endpoint URL.
+        token (str): The Bearer token (from st.secrets, for instance).
+    Returns:
+        str: The LLM-generated answer, or an error message if the call fails.
+    """
+    # Build the context
+    from appStore.rag_utils import truncate_to_tokens, build_context_for_result, compute_title
+    context = "\n\n".join([build_context_for_result(res, compute_title) for res in top_results])
+    context = truncate_to_tokens(context, 11500)  # Truncate to ~11.5k tokens
+    # Construct the prompt
+    prompt = (
+        "You are a project portfolio adviser at the development cooperation GIZ. "
+        "Using the following context, answer the question in English precisely. "
+        "Ensure that any project title mentioned in your answer is wrapped in ** (markdown bold). "
+        "Only output the final answer below, without repeating the context or question.\n\n"
+        f"Context:\n{context}\n\n"
+        f"Question: {query}\n\n"
+        "Answer:"
+    )
+    headers = {"Authorization": f"Bearer {token}"}
+    payload = {"inputs": prompt, "parameters": {"max_new_tokens": 300}}
+    response = requests.post(endpoint, headers=headers, json=payload)
+    if response.status_code == 200:
+        result = response.json()
+        answer = result[0].get("generated_text", "")
+        if "Answer:" in answer:
+            answer = answer.split("Answer:")[-1].strip()
+        return answer
+    else:
+        return f"Error in generating answer: {response.text}"