branch: master

- Created a template for providers.yaml to define API providers and models.
- Added a new providers.yaml file with initial provider configurations.
- Implemented fix_things.py to update chunk documents in ArangoDB.
- Developed make_arango_embeddings.py to generate embeddings for talks and store them in ArangoDB.
- Introduced sync_talks.py to synchronize new speeches from riksdagen.se and process them.
- Added notes.md for documentation on riksdagsgruppen login details.
- Created test_make_arango_embeddings.py for integration testing of embedding generation.
- Implemented test_gpu.py to test image input handling with vLLM.
parent
3ba8c3340a
commit
88e0244429
37 changed files with 2282 additions and 373 deletions
Binary file not shown.
@ -0,0 +1,144 @@ |
||||
#!/usr/bin/env python3 |
||||
""" |
||||
System Resource Monitor - Logs system stats to help diagnose SSH connectivity issues. |
||||
|
||||
This script monitors: |
||||
- CPU usage |
||||
- Memory usage |
||||
- Disk usage |
||||
- Network connectivity |
||||
- SSH service status |
||||
- System load |
||||
- Active connections |
||||
|
||||
Run continuously to capture when the system becomes unreachable. |
||||
""" |
||||
|
||||
import psutil |
||||
import time |
||||
import logging |
||||
from datetime import datetime |
||||
from pathlib import Path |
||||
|
||||
# Setup logging to file with rotation
# NOTE(review): despite the comment above, no rotating handler is configured —
# a plain FileHandler grows unboundedly; consider logging.handlers.RotatingFileHandler.
# Writing to /var/log normally requires root privileges — TODO confirm run context.
log_file = Path("/var/log/system_monitor.log")
logging.basicConfig(
    level=logging.INFO,
    format='%(asctime)s - %(levelname)s - %(message)s',
    handlers=[
        logging.FileHandler(log_file),
        logging.StreamHandler()  # Also print to console
    ]
)
||||
|
||||
def check_ssh_service() -> dict:
    """
    Check if SSH service is running.

    Returns:
        dict: Service status information. On success contains 'running'
        (bool) and 'status' (systemctl output); on failure contains
        'running': False and an 'error' string.
    """
    try:
        import subprocess

        probe = subprocess.run(
            ['systemctl', 'is-active', 'ssh'],
            capture_output=True,
            text=True,
            timeout=5,
        )
        is_active = probe.returncode == 0
        return {'running': is_active, 'status': probe.stdout.strip()}
    except Exception as exc:
        # systemctl missing, timeout, etc. — report rather than raise.
        return {'running': False, 'error': str(exc)}
||||
|
||||
def get_system_stats() -> dict:
    """
    Collect current system statistics.

    Returns:
        dict: System statistics including CPU, memory, disk, network,
        load averages, and the number of open connections.
    """
    # cpu_percent blocks for its 1-second sampling interval, so take it first.
    cpu_pct = psutil.cpu_percent(interval=1)
    core_count = psutil.cpu_count()

    mem = psutil.virtual_memory()
    swap_info = psutil.swap_memory()

    root_disk = psutil.disk_usage('/')

    net = psutil.net_io_counters()

    # 1-, 5-, and 15-minute load averages.
    one_min, five_min, fifteen_min = psutil.getloadavg()

    open_connections = len(psutil.net_connections())

    gib = 1024 ** 3
    return {
        'cpu_percent': cpu_pct,
        'cpu_count': core_count,
        'memory_percent': mem.percent,
        'memory_available_gb': mem.available / gib,
        'swap_percent': swap_info.percent,
        'disk_percent': root_disk.percent,
        'disk_free_gb': root_disk.free / gib,
        'network_bytes_sent': net.bytes_sent,
        'network_bytes_recv': net.bytes_recv,
        'load_1min': one_min,
        'load_5min': five_min,
        'load_15min': fifteen_min,
        'connections': open_connections,
    }
||||
|
||||
def monitor_loop(interval_seconds: int = 60):
    """
    Main monitoring loop that logs system stats at regular intervals.

    Runs forever; each cycle samples the system, logs one summary line,
    and escalates to WARNING/ERROR when thresholds are exceeded.

    Args:
        interval_seconds: How often to log stats (default: 60 seconds)
    """
    logging.info("Starting system monitoring...")

    while True:
        try:
            stats = get_system_stats()
            ssh_status = check_ssh_service()

            # One pipe-separated summary line per cycle.
            summary = " | ".join([
                f"CPU: {stats['cpu_percent']:.1f}%",
                f"MEM: {stats['memory_percent']:.1f}% ({stats['memory_available_gb']:.2f}GB free)",
                f"DISK: {stats['disk_percent']:.1f}% ({stats['disk_free_gb']:.2f}GB free)",
                f"LOAD: {stats['load_1min']:.2f} {stats['load_5min']:.2f} {stats['load_15min']:.2f}",
                f"CONN: {stats['connections']}",
                f"SSH: {ssh_status.get('status', 'unknown')}",
            ])

            # Threshold ladder: first matching condition wins.
            if stats['cpu_percent'] > 90:
                logging.warning(f"HIGH CPU! {summary}")
            elif stats['memory_percent'] > 90:
                logging.warning(f"HIGH MEMORY! {summary}")
            elif stats['disk_percent'] > 90:
                logging.warning(f"HIGH DISK USAGE! {summary}")
            elif stats['load_1min'] > stats['cpu_count'] * 2:
                logging.warning(f"HIGH LOAD! {summary}")
            elif not ssh_status.get('running'):
                logging.error(f"SSH SERVICE DOWN! {summary}")
            else:
                logging.info(summary)

            time.sleep(interval_seconds)

        except Exception as e:
            # Keep monitoring even if a single sample fails.
            logging.error(f"Error in monitoring loop: {e}")
            time.sleep(interval_seconds)


if __name__ == "__main__":
    monitor_loop(interval_seconds=60)  # Log every 60 seconds
||||
@ -0,0 +1,19 @@ |
||||
[Unit] |
||||
Description=Riksdagen daily talk sync |
||||
# Wait for network before starting |
||||
After=network-online.target |
||||
Wants=network-online.target |
||||
|
||||
[Service] |
||||
Type=oneshot |
||||
User=lasse |
||||
WorkingDirectory=/home/lasse/riksdagen |
||||
# Loads ARANGO_PWD and other env vars from the project .env file |
||||
EnvironmentFile=/home/lasse/riksdagen/.env |
||||
ExecStart=/home/lasse/riksdagen/.venv/bin/python /home/lasse/riksdagen/scripts/sync_talks.py |
||||
# Log stdout/stderr to the systemd journal (view with: journalctl -u riksdagen-sync) |
||||
StandardOutput=journal |
||||
StandardError=journal |
||||
|
||||
[Install] |
||||
WantedBy=multi-user.target |
||||
@ -0,0 +1,11 @@ |
||||
[Unit] |
||||
Description=Run riksdagen daily talk sync at 06:00 |
||||
|
||||
[Timer] |
||||
# Run every day at 06:00 |
||||
OnCalendar=*-*-* 06:00:00 |
||||
# If the server was off at 06:00, run the job as soon as it comes back up |
||||
Persistent=true |
||||
|
||||
[Install] |
||||
WantedBy=timers.target |
||||
@ -0,0 +1,10 @@ |
||||
[Interface]
# SECURITY NOTE(review): the PrivateKey below (and the PresharedKey in the
# [Peer] section) are secrets — they must not be committed to version
# control. Rotate these keys and move this file out of the repository.
PrivateKey = yDRb0EYZkUZCuYax44lSBAP3vmN+mPdDQEh2hAQ10lY=
||||
Address = 10.156.168.2/24 |
||||
DNS = 1.1.1.1, 1.0.0.1 |
||||
|
||||
[Peer] |
||||
PublicKey = 6gwhWDypmpxrGaobEh8xZIXvRIKdp0pWH6YWZ9F8twY= |
||||
PresharedKey = XAD5qpUMr0Ouz2azeXfH7J5tE3iSi5XJOdzdrUTSbRg= |
||||
Endpoint = 98.128.172.165:51820 |
||||
AllowedIPs = 0.0.0.0/0, ::0/0 |
||||
@ -0,0 +1,6 @@ |
||||
""" |
||||
Public entry points for the Riksdagen MCP server package. |
||||
""" |
||||
from .server import run |
||||
|
||||
__all__ = ("run",) |
||||
@ -0,0 +1,24 @@ |
||||
from __future__ import annotations |
||||
|
||||
import os |
||||
import secrets |
||||
|
||||
|
||||
def validate_token(provided_token: str) -> None:
    """
    Ensure the caller supplied the expected bearer token.

    Args:
        provided_token: Token received from the MCP client.

    Raises:
        RuntimeError: If the server token is not configured.
        PermissionError: If the token is missing or incorrect.
    """
    expected = os.getenv("MCP_SERVER_TOKEN")
    if not expected:
        raise RuntimeError("MCP_SERVER_TOKEN environment variable must be set for authentication.")
    if not provided_token:
        raise PermissionError("Missing MCP access token.")
    # Constant-time comparison avoids leaking token contents via timing.
    tokens_match = secrets.compare_digest(provided_token, expected)
    if not tokens_match:
        raise PermissionError("Invalid MCP access token.")
||||
@ -0,0 +1,130 @@ |
||||
import ssl |
||||
import socket |
||||
from datetime import datetime |
||||
from typing import Any, Dict, List, Optional |
||||
import argparse |
||||
import pprint |
||||
import sys # added to detect whether --host was passed |
||||
|
||||
def fetch_certificate(host: str, port: int = 443, server_hostname: Optional[str] = None, timeout: float = 5.0) -> Dict[str, Any]:
    """
    Fetch the TLS certificate from host:port. This function intentionally
    uses a non-verifying SSL context to retrieve the certificate even if it
    doesn't validate, so we can inspect its fields.

    Parameters:
    - host: TCP connect target (can be an IP or hostname)
    - port: TCP port (default 443)
    - server_hostname: SNI value to send. If None, server_hostname = host.
    - timeout: socket connect timeout in seconds

    Returns:
        Dictionary with the peer certificate (as returned by SSLSocket.getpeercert()) and additional metadata.
    """
    # Local import: this block's module header is defined elsewhere.
    from datetime import timezone

    if server_hostname is None:
        server_hostname = host

    # Create an SSL context that does NOT verify so we can always fetch the cert.
    # NOTE(review): with verify_mode=CERT_NONE, SSLSocket.getpeercert() returns
    # an empty dict on CPython (the decoded cert is only populated for verified
    # connections) — the downstream report may be empty. Consider
    # getpeercert(binary_form=True) plus a DER parser if full inspection is needed.
    context = ssl.create_default_context()
    context.check_hostname = False
    context.verify_mode = ssl.CERT_NONE

    with socket.create_connection((host, port), timeout=timeout) as sock:
        with context.wrap_socket(sock, server_hostname=server_hostname) as sslsock:
            cert = sslsock.getpeercert()
            peer_cipher = sslsock.cipher()
            # datetime.utcnow() is deprecated (Python 3.12); build the same
            # "Z"-suffixed UTC timestamp from an aware datetime instead.
            peertime = datetime.now(timezone.utc).replace(tzinfo=None).isoformat() + "Z"

    info: Dict[str, Any] = {
        "peer_certificate": cert,
        "cipher": peer_cipher,
        "fetched_at": peertime,
        "server_hostname_used": server_hostname,
    }
    return info
||||
|
||||
def parse_san(cert: Dict[str, Any]) -> List[str]:
    """Return list of DNS names from subjectAltName (if any)."""
    entries = cert.get("subjectAltName", ())
    # Each entry is a (type, value) pair; keep only DNS names.
    return [value for kind, value in entries if kind.lower() == "dns"]
||||
|
||||
def format_subject(cert: Dict[str, Any]) -> str:
    """Return a short human-friendly subject string."""
    # The subject is a tuple of RDNs, each a tuple of (name, value) pairs;
    # flatten them all into "name=value" segments.
    pairs: List[str] = []
    for rdn in cert.get("subject", ()):
        pairs.extend(f"{name}={value}" for name, value in rdn)
    return ", ".join(pairs)
||||
|
||||
def check_hostname_match(cert: Dict[str, Any], hostname: str) -> bool:
    """
    Check whether the certificate matches hostname.

    The previous implementation called ssl.match_hostname(), which was
    deprecated in Python 3.7 and removed in 3.12 — and because the
    AttributeError was swallowed by the bare except, the function silently
    returned False for every host on 3.12+. This version performs the DNS
    name comparison directly: it checks the subjectAltName DNS entries,
    falling back to the subject commonName only when no DNS SANs exist
    (per RFC 6125), and honours a single '*' left-most wildcard label.

    Args:
        cert: Certificate dict as returned by SSLSocket.getpeercert().
        hostname: Hostname to compare against.

    Returns:
        True if the certificate covers hostname, False otherwise.
    """
    try:
        candidates = [val for typ, val in cert.get("subjectAltName", ()) if typ.lower() == "dns"]
        if not candidates:
            # Fallback: commonName is only consulted when no DNS SANs exist.
            for rdn in cert.get("subject", ()):
                for key, val in rdn:
                    if key == "commonName":
                        candidates.append(val)
        target = hostname.lower().rstrip(".")
        return any(_dns_name_matches(pattern.lower(), target) for pattern in candidates)
    except Exception:
        # Malformed cert structures are treated as a non-match, as before.
        return False


def _dns_name_matches(pattern: str, host: str) -> bool:
    """Return True if a certificate DNS name (possibly a '*.' wildcard) covers host."""
    if pattern == host:
        return True
    labels = pattern.split(".")
    host_labels = host.split(".")
    # Only a complete '*' as the left-most label is honoured, and it must
    # match exactly one label (no "*.com" matching "a.b.com").
    if len(labels) >= 2 and labels[0] == "*" and len(labels) == len(host_labels):
        return labels[1:] == host_labels[1:]
    return False
||||
|
||||
def print_report(host: str, port: int, server_hostname: Optional[str]) -> None:
    """
    Fetch certificate and print a readable report.

    Args:
        host: TCP connect target (IP or hostname).
        port: TCP port to connect to.
        server_hostname: SNI value to send; falls back to host when None.
    """
    # NOTE(review): fetch_certificate uses CERT_NONE, under which
    # getpeercert() may return an empty dict — the fields below can all be
    # blank in that case; confirm against a live connection.
    info = fetch_certificate(host=host, port=port, server_hostname=server_hostname)
    cert = info["peer_certificate"]

    print(f"Connected target: {host}:{port}")
    print(f"SNI sent: {info['server_hostname_used']}")
    print(f"Cipher: {info['cipher']}")
    print(f"Fetched at (UTC): {info['fetched_at']}")
    print()

    print("Subject:")
    print(" ", format_subject(cert))
    print()

    print("Issuer:")
    # Issuer shares the subject's RDN structure; flatten to "k=v" pairs.
    issuer = cert.get("issuer", ())
    issuer_parts = []
    for rdn in issuer:
        for k, v in rdn:
            issuer_parts.append(f"{k}={v}")
    print(" ", ", ".join(issuer_parts))
    print()

    sans = parse_san(cert)
    print("Subject Alternative Names (SANs):")
    if sans:
        for n in sans:
            print(" -", n)
    else:
        print(" (none)")

    not_before = cert.get("notBefore")
    not_after = cert.get("notAfter")
    print()
    print("Validity:")
    print(" notBefore:", not_before)
    print(" notAfter: ", not_after)

    match = check_hostname_match(cert, server_hostname or host)
    print()
    print(f"Hostname match for '{server_hostname or host}':", "YES" if match else "NO")

    # For debugging show the full cert dict if requested
    # pprint.pprint(cert)
||||
|
||||
def main() -> None:
    """CLI entry point: parse arguments and print the certificate report."""
    parser = argparse.ArgumentParser(description="Fetch and inspect TLS certificate from a host (SNI-aware).")
    # make --host optional and default to api.rixdagen.se so running without args works
    parser.add_argument("--host", "-H", required=False, default="api.rixdagen.se", help="Host or IP to connect to (TCP target). Defaults to api.rixdagen.se")
    parser.add_argument("--port", "-p", type=int, default=443, help="Port to connect to (default 443).")
    parser.add_argument("--sni", help="SNI hostname to send. If omitted, the --host value is used as SNI.")
    args = parser.parse_args()

    # Notify when using the default host for quick testing.  The previous
    # membership test ('--host' not in sys.argv) missed the '--host=value'
    # form, which argparse also accepts.
    host_given = any(
        arg == "--host" or arg == "-H" or arg.startswith("--host=")
        for arg in sys.argv[1:]
    )
    if not host_given:
        print("No --host provided: defaulting to api.rixdagen.se (you can override with --host or -H)")

    print_report(host=args.host, port=args.port, server_hostname=args.sni)


if __name__ == "__main__":
    main()
||||
@ -0,0 +1,114 @@ |
||||
""" |
||||
RiksdagenTools MCP server (HTTP only, compatible with current FastMCP version) |
||||
""" |
||||
from __future__ import annotations |
||||
import asyncio |
||||
import logging |
||||
import os |
||||
import inspect |
||||
from typing import Any, Dict, List, Optional, Sequence |
||||
from fastmcp import FastMCP |
||||
from mcp_server.auth import validate_token |
||||
from mcp_server import tools |
||||
|
||||
# Transport configuration, overridable via environment variables.
HOST = os.getenv("MCP_HOST", "127.0.0.1")
PORT = int(os.getenv("MCP_PORT", "8010"))
PATH = os.getenv("MCP_PATH", "/mcp")
LOG_LEVEL = os.getenv("LOG_LEVEL", "INFO").upper()

logging.basicConfig(
    level=LOG_LEVEL,
    format="%(asctime)s [%(levelname)s] %(name)s: %(message)s",
    datefmt="%Y-%m-%d %H:%M:%S",
)
log = logging.getLogger("mcp_server")

# FastMCP application instance; the @app.tool() functions below register on it.
app = FastMCP("RiksdagenTools")
||||
|
||||
# --- tools unchanged ---
@app.tool()
async def search_documents(token: str, aql_query: str) -> Dict[str, Any]:
    """Execute a read-only AQL query via tools.search_documents (token required)."""
    validate_token(token)
    # The Arango client is synchronous; run it off the event loop.
    return await asyncio.to_thread(tools.search_documents, aql_query)
||||
|
||||
@app.tool()
async def aql_query(token: str, query: str) -> List[Dict[str, Any]]:
    """Execute a read-only AQL query and return the result rows (token required)."""
    validate_token(token)
    return await asyncio.to_thread(tools.run_aql_query, query)
||||
|
||||
@app.tool()
async def vector_search_talks(token: str, query: str, limit: int = 8) -> List[Dict[str, Any]]:
    """Semantic search over talks via tools.vector_search (token required)."""
    validate_token(token)
    return await asyncio.to_thread(tools.vector_search, query, limit)
||||
|
||||
@app.tool()
async def fetch_documents(
    token: str, document_ids: Sequence[str], fields: Optional[Sequence[str]] = None
) -> List[Dict[str, Any]]:
    """Fetch documents by id, optionally restricted to the given fields (token required)."""
    validate_token(token)
    # Normalize sequences to plain lists before crossing the thread boundary.
    return await asyncio.to_thread(
        tools.fetch_documents, list(document_ids), list(fields) if fields else None
    )
||||
|
||||
@app.tool()
async def arango_search(
    token: str,
    query: str,
    limit: int = 20,
    parties: Optional[Sequence[str]] = None,
    people: Optional[Sequence[str]] = None,
    from_year: Optional[int] = None,
    to_year: Optional[int] = None,
    return_snippets: bool = False,
    focus_ids: Optional[Sequence[str]] = None,
    speaker_ids: Optional[Sequence[str]] = None,
) -> Dict[str, Any]:
    """
    Search talks via tools.arango_search with optional filters (token required).

    Args:
        token: Bearer token; validated before any work is done.
        query: Search phrase.
        limit: Maximum number of hits to return.
        parties, people, from_year, to_year, return_snippets, focus_ids,
        speaker_ids: Optional filters forwarded verbatim to
            tools.arango_search (their exact semantics are defined there —
            not visible from this module).

    Returns:
        Result dictionary produced by tools.arango_search.
    """
    validate_token(token)
    # NOTE: arguments are passed positionally — the order below must stay
    # in sync with tools.arango_search's signature.
    return await asyncio.to_thread(
        tools.arango_search,
        query,
        limit,
        parties,
        people,
        from_year,
        to_year,
        return_snippets,
        focus_ids,
        speaker_ids,
    )
||||
|
||||
@app.tool()
async def ping() -> str:
    """
    Lightweight test tool for connectivity checks.

    Returns:
        A short confirmation string ("ok"). This tool is intentionally
        unauthenticated so it can be used to validate the transport/proxy
        (e.g. nginx -> backend) without presenting credentials.
    """
    return "ok"
||||
|
||||
# --- Entrypoint ---
def run() -> None:
    """Start the FastMCP server over streamable HTTP on HOST:PORT at PATH."""
    log.info(
        "Starting RiksdagenTools MCP server (HTTP) on http://%s:%d%s",
        HOST,
        PORT,
        PATH,
    )

    try:
        # Pass host, port, and path directly to run() method
        app.run(
            transport="streamable-http",
            host=HOST,
            port=PORT,
            path=PATH,
        )
    except Exception:
        # Log the full traceback, then propagate so a supervisor sees the failure.
        log.exception("Unexpected error while running the MCP server.")
        raise


if __name__ == "__main__":
    run()
||||
@ -0,0 +1,168 @@ |
||||
""" |
||||
Test script for the RiksdagenTools MCP server (HTTP transport). |
||||
This script connects to the MCP server via Streamable HTTP and tests your main tools. |
||||
Ensure the MCP server is running and that the environment variable MCP_SERVER_TOKEN is set. |
||||
Also adjust MCP_SERVER_URL if needed. |
||||
""" |
||||
|
||||
import os |
||||
import asyncio |
||||
from typing import Any, Dict, List, Optional, Sequence |
||||
|
||||
from mcp.client.streamable_http import streamablehttp_client |
||||
from mcp.client.session import ClientSession # adjusted import per SDK version |
||||
|
||||
# NOTE(review): a real-looking token is hard-coded as the fallback default —
# secrets should not live in source; require MCP_SERVER_TOKEN to be set instead.
TOKEN: str = os.environ.get("MCP_SERVER_TOKEN", "2q89rwpfaiukdjshp298n3qw")
# Use the public HTTPS endpoint by default so tests target the nginx proxy.
SERVER_URL: str = os.environ.get("MCP_SERVER_URL", "https://api.rixdagen.se/mcp")
||||
|
||||
async def run_tests() -> None:
    """
    Attempt to connect to SERVER_URL and run the tool tests. On SSL certificate
    verification failures, optionally retry against the backend IP if
    MCP_FALLBACK_TO_IP=1 is set (or a custom MCP_FALLBACK_URL is provided).
    """
    async def run_with_url(url: str) -> None:
        # Open one streamable-HTTP MCP session and exercise each tool in turn.
        print(f"Connecting to server URL: {url}")
        async with streamablehttp_client(
            url=url,
            headers={ "Authorization": f"Bearer {TOKEN}" }
        ) as (read_stream, write_stream, get_session_id):
            async with ClientSession(read_stream, write_stream) as session:
                # initialize the session (if needed)
                init_result = await session.initialize()
                print("Initialized session:", init_result)

                print("\nListing available tools...")
                tools_info = await session.list_tools()
                print("Tools:", [ tool.name for tool in tools_info.tools ])

                # Test aql_query
                print("\n== Testing aql_query ==")
                result1 = await session.call_tool(
                    "aql_query",
                    arguments={
                        "token": TOKEN,
                        "query": "FOR doc IN talks LIMIT 2 RETURN { _id: doc._id, talare: doc.talare }"
                    }
                )
                print("aql_query result:", result1)

                # Test search_documents
                print("\n== Testing search_documents ==")
                result2 = await session.call_tool(
                    "search_documents",
                    arguments={
                        "token": TOKEN,
                        "aql_query": "FOR doc IN talks LIMIT 2 RETURN { _id: doc._id, talare: doc.talare }"
                    }
                )
                print("search_documents result:", result2)

                # Test vector_search_talks
                print("\n== Testing vector_search_talks ==")
                result3 = await session.call_tool(
                    "vector_search_talks",
                    arguments={
                        "token": TOKEN,
                        "query": "klimatförändringar",
                        "limit": 2
                    }
                )
                print("vector_search_talks result:", result3)

                # Test fetch_documents
                print("\n== Testing fetch_documents ==")
                # try to pull out IDs from result3 if available
                # NOTE(review): assumes result3 exposes an 'output' list of
                # dicts — confirm against the SDK's CallToolResult shape.
                doc_ids: List[str]
                maybe = result3
                if hasattr(maybe, "output") and isinstance(maybe.output, list) and maybe.output:
                    doc_ids = [ maybe.output[0].get("_id", "") ]
                else:
                    doc_ids = ["talks/1"]
                result4 = await session.call_tool(
                    "fetch_documents",
                    arguments={
                        "token": TOKEN,
                        "document_ids": doc_ids
                    }
                )
                print("fetch_documents result:", result4)

                # Test arango_search
                print("\n== Testing arango_search ==")
                result5 = await session.call_tool(
                    "arango_search",
                    arguments={
                        "token": TOKEN,
                        "query": "klimat",
                        "limit": 2
                    }
                )
                print("arango_search result:", result5)

    # try primary URL first
    try:
        await run_with_url(SERVER_URL)
    except Exception as e:  # capture failures from streamablehttp_client / httpx
        # Classify the failure by substring matching on the exception text.
        err_str = str(e).lower()
        ssl_fail = "certificate_verify_failed" in err_str or "hostname mismatch" in err_str or "certificate verify failed" in err_str
        gateway_fail = "502" in err_str or "bad gateway" in err_str or "502 bad gateway" in err_str

        if gateway_fail:
            print("Received 502 Bad Gateway from the proxy when connecting to the server URL.")
            # If user explicitly set fallback env var, retry against backend IP or custom fallback
            fallback_flag = os.environ.get("MCP_FALLBACK_TO_IP", "0").lower() in ("1", "true", "yes")
            if fallback_flag:
                fallback_url = os.environ.get("MCP_FALLBACK_URL", "http://127.0.0.1:8010/mcp")
                print(f"Retrying with fallback URL (MCP_FALLBACK_URL or default backend): {fallback_url}")
                await run_with_url(fallback_url)
                return
            print("")
            print("Possible causes:")
            print("- The proxy (nginx) couldn't reach the backend (backend down, wrong proxy_pass or path).")
            print("- Proxy buffering or HTTP version issues interfering with streaming transport.")
            print("")
            print("Options:")
            print("- Bypass the proxy and target the backend directly:")
            print("  export MCP_SERVER_URL='http://127.0.0.1:8010/mcp'")
            print("- Or enable automatic fallback to the backend (insecure) for testing:")
            print("  export MCP_FALLBACK_TO_IP=1")
            print("  # optionally override the fallback target")
            print("  export MCP_FALLBACK_URL='http://127.0.0.1:8010/mcp'")
            print("- Check the proxy's error log (e.g. /var/log/nginx/error.log) for upstream errors.")
            print("")
            # re-raise so caller still sees the error if they don't follow guidance
            raise

        if ssl_fail:
            print("SSL certificate verification failed while connecting to the server URL.")
            # If user explicitly set fallback env var, retry against backend IP or custom fallback
            fallback_flag = os.environ.get("MCP_FALLBACK_TO_IP", "0").lower() in ("1", "true", "yes")
            if fallback_flag:
                fallback_url = os.environ.get("MCP_FALLBACK_URL", "http://192.168.1.10:8010/mcp")
                print(f"Retrying with fallback URL (MCP_FALLBACK_URL or default backend IP): {fallback_url}")
                await run_with_url(fallback_url)
                return
            # Otherwise give actionable guidance
            print("")
            print("Possible causes:")
            print("- The TLS certificate served for api.rixdagen.se does not match that hostname on this machine.")
            print("")
            print("Options:")
            print("- Set MCP_SERVER_URL to the backend HTTP address to bypass TLS: e.g.")
            print("  export MCP_SERVER_URL='http://192.168.1.10:8010/mcp'")
            print("- Or enable automatic fallback to the backend IP for testing (insecure):")
            print("  export MCP_FALLBACK_TO_IP=1")
            print("  # optionally override the fallback target")
            print("  export MCP_FALLBACK_URL='http://192.168.1.10:8010/mcp'")
            print("")
            # re-raise so caller still sees the error if they don't follow guidance
            raise
        # Not an SSL or gateway failure: re-raise
        raise
||||
|
||||
def main() -> None:
    """Synchronous entry point wrapping the async test run."""
    asyncio.run(run_tests())


if __name__ == "__main__":
    main()
||||
@ -0,0 +1,81 @@ |
||||
import os |
||||
import sys |
||||
import asyncio |
||||
from typing import Tuple, Any |
||||
|
||||
from mcp.client.streamable_http import streamablehttp_client |
||||
from mcp.client.session import ClientSession |
||||
|
||||
SERVER_URL: str = os.environ.get("MCP_SERVER_URL", "http://127.0.0.1:8010/mcp") |
||||
TOKEN: str = os.environ.get("MCP_SERVER_TOKEN", "") |
||||
|
||||
|
||||
async def _extract_ping_result(res: Any) -> Any:
    """
    Extract a sensible value from various CallToolResult shapes returned by the SDK.

    Handles:
    - objects with 'structuredContent' (dict) -> use 'result' or first value
    - objects with 'output' attribute
    - objects with 'content' list containing a TextContent with .text
    - plain scalars
    """
    # Newer SDK responses commonly carry a structuredContent dict.
    structured = getattr(res, "structuredContent", None)
    if isinstance(structured, dict):
        if "result" in structured:
            return structured["result"]
        # No 'result' key: fall back to the first value, if any.
        for first_value in structured.values():
            return first_value

    # Older / alternative shape: an 'output' attribute.
    if hasattr(res, "output"):
        return res.output

    # Textual content list (TextContent objects).
    content = getattr(res, "content", None)
    if isinstance(content, list) and content:
        head = content[0]
        # Some SDK TextContent exposes 'text'; otherwise stringify.
        return head.text if hasattr(head, "text") else str(head)

    # Final fallback: try direct indexing, else string conversion.
    try:
        return res["result"]
    except Exception:
        return str(res)
||||
|
||||
|
||||
async def check_ping(url: str, token: str) -> Tuple[bool, str]:
    """
    Connect to the MCP server at `url` and call the 'ping' tool.

    Returns:
        (ok, message) where ok is True if ping returned "ok", otherwise False.
    """
    # Send the bearer header only when a token is configured; the 'ping'
    # tool itself does not require authentication.
    headers = {"Authorization": f"Bearer {token}"} if token else {}
    try:
        async with streamablehttp_client(url=url, headers=headers) as (read_stream, write_stream, _):
            async with ClientSession(read_stream, write_stream) as session:
                await session.initialize()
                res = await session.call_tool("ping", arguments={})
                output = await _extract_ping_result(res)  # robust extractor
                if output == "ok":
                    return True, "ping -> ok"
                return False, f"unexpected ping response: {output!r}"
    except Exception as e:
        # Any transport/protocol failure is reported as a non-ok result.
        return False, f"error connecting/calling ping: {e!r}"
||||
|
||||
|
||||
def main() -> None:
    """Run the ping check once, print the outcome, and exit non-zero on failure."""
    ok, msg = asyncio.run(check_ping(SERVER_URL, TOKEN))
    print(msg)
    if not ok:
        # Non-zero exit so scripts/monitoring can detect the failure.
        sys.exit(1)


if __name__ == "__main__":
    main()
||||
@ -0,0 +1,360 @@ |
||||
from __future__ import annotations |
||||
|
||||
from dataclasses import dataclass |
||||
from typing import Any, Dict, Iterable, List, Optional, Sequence |
||||
from pydantic import BaseModel, Field |
||||
|
||||
import env_manager |
||||
|
||||
env_manager.set_env() |
||||
|
||||
from arango.collection import Collection # noqa: E402 |
||||
from arango_client import arango # noqa: E402 |
||||
from backend.services.search import SearchService # noqa: E402 |
||||
from _chromadb.chroma_client import chroma_db # noqa: E402 |
||||
|
||||
|
||||
class HitDocument(BaseModel):
    """
    Normalized representation of a search hit across the various tools,
    enabling consistent downstream handling.

    Attributes:
        id (Optional[str]): Fully qualified ArangoDB document identifier.
        key (Optional[str]): Document key without collection prefix.
        speaker (Optional[str]): Name of the speaker associated with the hit.
        party (Optional[str]): Party affiliation of the speaker.
        date (Optional[str]): ISO formatted document date (YYYY-MM-DD).
        snippet (Optional[str]): Contextual snippet or highlight from the document.
        text (Optional[str]): Full text of the document when available.
        score (Optional[float]): Relevance score supplied by the executing tool.
        metadata (Dict[str, Any]): Additional tool-specific metadata to preserve.
    """
    # (A second, redundant class docstring literal was removed here — it was a
    # dead no-op statement duplicating the docstring above.)

    id: Optional[str] = Field(
        default=None, description="Fully qualified ArangoDB document identifier."
    )
    key: Optional[str] = Field(
        default=None, description="Document key without collection prefix."
    )
    speaker: Optional[str] = Field(
        default=None, description="Name of the speaker associated with the hit."
    )
    party: Optional[str] = Field(
        default=None, description="Party affiliation of the speaker."
    )
    date: Optional[str] = Field(
        default=None, description="ISO formatted document date (YYYY-MM-DD)."
    )
    snippet: Optional[str] = Field(
        default=None, description="Contextual snippet or highlight from the document."
    )
    text: Optional[str] = Field(
        default=None, description="Full text of the document when available."
    )
    score: Optional[float] = Field(
        default=None, description="Relevance score supplied by the executing tool."
    )
    metadata: Dict[str, Any] = Field(
        default_factory=dict,
        description="Additional metadata specific to the originating tool that should be preserved.",
    )

    def to_string(self, include_metadata: bool = True) -> str:
        """
        Render the object as a human-readable string with uppercase labels.

        Args:
            include_metadata (bool, optional): Whether to include metadata fields
                in the output. Defaults to True.

        Returns:
            str: A formatted string representation, each field rendered as an
            uppercase label followed by its value, segments joined by double
            newlines.
        """
        data: Dict[str, Any] = self.model_dump(exclude_none=True)
        metadata: Dict[str, Any] = data.pop("metadata", {})
        segments: List[str] = []
        for field_name, field_value in data.items():
            segments.append(f"{field_name.upper()}\n{field_value}")
        # Fix: the include_metadata flag was previously ignored and metadata
        # was always rendered regardless of the caller's choice.
        if include_metadata:
            for meta_key, meta_value in metadata.items():
                segments.append(f"{meta_key.upper()}\n{meta_value}")
        return "\n\n".join(segments)
||||
|
||||
|
||||
class HitsResponse(BaseModel):
    """
    Container for multiple HitDocument instances with helpers for rendering
    the collection as text.

    Attributes:
        hits (List[HitDocument]): A list of collected search hits.
    """

    hits: List[HitDocument] = Field(
        default_factory=list, description="Collected search hits."
    )

    def to_string(self, include_metadata: bool = True) -> str:
        """
        Render all hits as a single string, separated by a visual divider.

        Args:
            include_metadata (bool, optional): Forwarded to each hit's
                to_string(). Defaults to True.

        Returns:
            str: All hits joined by "\n\n---\n\n"; an empty string if there
            are no hits.
        """
        # (A redundant second docstring literal inside this method was removed —
        # it was a dead no-op statement.  The parameter also gained an explicit
        # bool annotation for consistency with HitDocument.to_string.)
        if not self.hits:
            return ""
        return "\n\n---\n\n".join(
            hit.to_string(include_metadata=include_metadata) for hit in self.hits
        )
||||
|
||||
|
||||
|
||||
def ensure_read_only_aql(query: str) -> None:
    """
    Reject AQL statements that attempt to mutate data or omit a RETURN clause.

    Args:
        query: Raw AQL statement from the client.

    Raises:
        ValueError: If the query contains a data-modification keyword or has
            no RETURN clause.
    """
    import re

    normalized = query.upper()
    # FIX: the original matched substrings like "INSERT " (with a trailing
    # space), so "INSERT\n..." bypassed the filter while a legitimate query
    # such as "FOR d IN c\nRETURN d" was rejected (no " RETURN " substring).
    # Tokenizing on word characters is whitespace-agnostic. The original
    # list also contained "UPSERT " twice; a set removes the duplication.
    tokens = set(re.findall(r"[A-Z_]+", normalized))
    forbidden = {
        "INSERT",
        "UPDATE",
        "UPSERT",
        "REMOVE",
        "REPLACE",
        "DELETE",
        "DROP",
        "TRUNCATE",
        "MERGE",
    }
    if tokens & forbidden:
        raise ValueError("Only read-only AQL queries are allowed.")
    if "RETURN" not in tokens:
        raise ValueError("AQL queries must include a RETURN clause.")
||||
|
||||
|
||||
def strip_private_fields(document: Dict[str, Any]) -> Dict[str, Any]:
    """
    Remove large internal fields from a document dictionary.

    Args:
        document: Document returned by ArangoDB.

    Returns:
        Sanitized shallow copy without chunk payloads.
    """
    # FIX: the docstring promised a "sanitized copy", but the original code
    # deleted "chunks" from the caller's dict in place. Build a copy instead
    # so callers keep their original document intact.
    return {key: value for key, value in document.items() if key != "chunks"}
||||
|
||||
|
||||
def search_documents(aql_query: str) -> Dict[str, Any]:
    """
    Execute a read-only AQL query and return the result set together with
    the query string.

    Args:
        aql_query: Read-only AQL statement supplied by the client.

    Returns:
        Dictionary containing the executed AQL string, row count, and
        sanitized result rows.
    """
    # Validate before touching the database at all.
    ensure_read_only_aql(aql_query)
    sanitized_rows = []
    for document in arango.execute_aql(aql_query):
        sanitized_rows.append(strip_private_fields(document))
    return {
        "aql": aql_query,
        "row_count": len(sanitized_rows),
        "rows": sanitized_rows,
    }
||||
|
||||
|
||||
def run_aql_query(aql_query: str) -> List[Dict[str, Any]]:
    """
    Execute a read-only AQL query and return the rows.

    Args:
        aql_query: Read-only AQL statement.

    Returns:
        List of result rows with heavy internal fields stripped.
    """
    ensure_read_only_aql(aql_query)
    rows: List[Dict[str, Any]] = []
    for document in arango.execute_aql(aql_query):
        rows.append(strip_private_fields(document))
    return rows
||||
|
||||
|
||||
def _get_existing_collection(name: str) -> Collection:
    """
    Fetch an existing Chroma collection without creating new data.

    Args:
        name: Collection identifier.

    Returns:
        The requested collection.

    Raises:
        ValueError: If the collection is absent.
    """
    client = chroma_db._client
    existing_names = [collection.name for collection in client.list_collections()]
    if name in existing_names:
        return client.get_collection(name=name)
    raise ValueError(f"Chroma collection '{name}' does not exist.")
||||
|
||||
|
||||
def vector_search(query: str, limit: int) -> List[Dict[str, Any]]:
    """
    Perform semantic search against the pre-built Chroma collection.

    Args:
        query: Free-form search text.
        limit: Maximum number of hits to return.

    Returns:
        List of hit dictionaries with metadata and scores. Hits whose _id
        cannot be determined are dropped.
    """
    # The collection shares its name with the last path component of the
    # Chroma data directory.
    collection_name = chroma_db.path.split("/")[-1]
    chroma_collection = _get_existing_collection(collection_name)
    results = chroma_collection.query(
        query_texts=[query],
        n_results=limit,
    )
    # Chroma returns parallel, per-query lists; we only issued one query,
    # so index [0] below selects its result columns.
    metadatas = results.get("metadatas") or []
    documents = results.get("documents") or []
    ids = results.get("ids") or []
    distances = results.get("distances") or []

    def as_int(value: Any, default: int = -1) -> int:
        """Best-effort integer coercion; returns *default* when impossible."""
        if isinstance(value, int):
            return value
        if isinstance(value, float) and value.is_integer():
            return int(value)
        if isinstance(value, str):
            # BUG FIX: the old check stripped *all* leading "+"/"-" signs
            # before isdigit(), so strings like "+-5" passed the check but
            # int("+-5") raised ValueError. Let int() itself decide.
            try:
                return int(value.strip())
            except ValueError:
                return default
        return default

    hits: List[Dict[str, Any]] = []
    for index, metadata in enumerate(metadatas[0] if metadatas else []):
        meta = metadata or {}
        document = documents[0][index] if documents else ""
        identifier = ids[0][index] if ids else ""
        hit = {
            "_id": meta.get("_id") or identifier,
            "heading": meta.get("heading") or meta.get("title") or meta.get("talare"),
            "snippet": meta.get("snippet") or meta.get("text") or document,
            "debateurl": meta.get("debateurl") or meta.get("debate_url"),
            "chunk_index": as_int(meta.get("chunk_index") or meta.get("index")),
            "score": distances[0][index] if distances else None,
        }
        # Skip hits we cannot link back to a source document.
        if hit["_id"]:
            hits.append(hit)
    return hits
||||
|
||||
|
||||
def fetch_documents(document_ids: Sequence[str], fields: Optional[Iterable[str]] = None) -> List[Dict[str, Any]]:
    """
    Pull full documents by _id while stripping heavy fields.

    Args:
        document_ids: Iterable with fully qualified Arango document ids.
        fields: Optional subset of fields to return.

    Returns:
        List of sanitized documents. Ids that do not resolve to an existing
        document are silently skipped.
    """
    # Tolerate ids that arrive with backslashes instead of "/" separators.
    ids = [doc_id.replace("\\", "/") for doc_id in document_ids]
    query = """
    FOR id IN @document_ids
        RETURN DOCUMENT(id)
    """
    # BUG FIX: DOCUMENT(id) yields null for unknown ids; the original code
    # then crashed on None.get(...). Filter missing documents out first.
    documents = [
        doc
        for doc in arango.execute_aql(query, bind_vars={"document_ids": ids})
        if doc is not None
    ]
    if fields:
        return [{field: doc.get(field) for field in fields if field in doc} for doc in documents]
    return [strip_private_fields(doc) for doc in documents]
||||
|
||||
|
||||
@dataclass
class SearchPayload:
    """
    Lightweight container passed to SearchService.search.
    """
    # Free-text search expression (the service's query string).
    q: str
    # Party filters; None disables party filtering.
    parties: Optional[List[str]]
    # Speaker-name filters; None disables name filtering.
    people: Optional[List[str]]
    # Debate-id filters; arango_search in this module always passes None.
    debates: Optional[List[str]]
    # Inclusive year-range bounds; either may be None.
    from_year: Optional[int]
    to_year: Optional[int]
    # Maximum number of hits to return.
    limit: int
    # Whether only snippets (not full documents) should be returned.
    return_snippets: bool
    # Optional list of document ids restricting the search scope.
    focus_ids: Optional[List[str]]
    # Optional list of speaker identifiers.
    speaker_ids: Optional[List[str]]
    # Single-speaker filter; unused by arango_search (defaults to None).
    speaker: Optional[str] = None
||||
|
||||
|
||||
def arango_search(
    query: str,
    limit: int,
    parties: Optional[Sequence[str]] = None,
    people: Optional[Sequence[str]] = None,
    from_year: Optional[int] = None,
    to_year: Optional[int] = None,
    return_snippets: bool = False,
    focus_ids: Optional[Sequence[str]] = None,
    speaker_ids: Optional[Sequence[str]] = None,
) -> Dict[str, Any]:
    """
    Run an ArangoSearch query using the existing SearchService utilities.

    Args:
        query: Search expression (supports AND/OR/NOT and phrases).
        limit: Maximum number of hits to return.
        parties: Party filters.
        people: Speaker name filters.
        from_year: Start year filter.
        to_year: End year filter.
        return_snippets: Whether only snippets should be returned.
        focus_ids: Optional list restricting the search scope.
        speaker_ids: Optional list of speaker identifiers.

    Returns:
        Dictionary containing results, stats, limit flag, and focus_ids for
        follow-up queries.
    """

    def _as_list(value: Optional[Sequence[str]]) -> Optional[List[str]]:
        # Normalize optional sequences to plain lists, or None when empty.
        return list(value) if value else None

    payload = SearchPayload(
        q=query,
        parties=_as_list(parties),
        people=_as_list(people),
        debates=None,
        from_year=from_year,
        to_year=to_year,
        limit=limit,
        return_snippets=return_snippets,
        focus_ids=_as_list(focus_ids),
        speaker_ids=_as_list(speaker_ids),
    )
    results, stats, limit_reached = SearchService().search(
        payload=payload,
        include_snippets=True,
        return_snippets=return_snippets,
        focus_ids=payload.focus_ids,
    )
    # Collect the ids of the returned hits so the caller can narrow a
    # follow-up search to exactly this result set.
    followup_ids = [
        hit["_id"] for hit in results if isinstance(hit, dict) and hit.get("_id")
    ]
    return {
        "results": results,
        "stats": stats,
        "limit_reached": limit_reached,
        "return_snippets": return_snippets,
        "focus_ids": followup_ids,
    }
||||
|
After Width: | Height: | Size: 153 KiB |
@ -0,0 +1,113 @@ |
||||
# Template for providers.yaml |
||||
# |
||||
# You can add any OpenAI API compatible provider to the "providers" list. |
||||
# For each provider you must also specify a list of models, along with model abilities. |
||||
# |
||||
# All fields are required unless marked as optional. |
||||
# |
||||
# Refer to your provider's API documentation for specific
# details such as model identifiers, capabilities, etc.
||||
# |
||||
# Note: Since the OpenAI API is not a standard we can't guarantee that all |
||||
# providers will work correctly with Raycast AI. |
||||
# |
||||
# To use this template, rename this file to `providers.yaml`.
||||
# |
||||
providers: |
||||
- id: perplexity |
||||
name: Perplexity |
||||
base_url: https://api.perplexity.ai |
||||
# Specify at least one api key if authentication is required. |
||||
# Optional if authentication is not required or is provided elsewhere. |
||||
# If individual models require separate api keys, then specify a separate `key` for each model's `provider` |
||||
api_keys: |
||||
perplexity: PERPLEXITY_KEY |
||||
# Optional additional parameters sent to the `/chat/completions` endpoint |
||||
additional_parameters: |
||||
return_images: true |
||||
web_search_options: |
||||
search_context_size: medium |
||||
# Specify all models to use with the current provider |
||||
models: |
||||
- id: sonar # `id` must match the identifier used by the provider |
||||
name: Sonar # name visible in Raycast |
||||
provider: perplexity # Only required if mapping to a specific api key |
||||
description: Perplexity AI model for general-purpose queries # optional |
||||
context: 128000 # refer to provider's API documentation |
||||
# Optional abilities - all child properties are also optional. |
||||
# If you specify abilities incorrectly the model may fail to work as expected in Raycast AI. |
||||
# Refer to provider's API documentation for model abilities. |
||||
abilities: |
||||
temperature: |
||||
supported: true |
||||
vision: |
||||
supported: true |
||||
system_message: |
||||
supported: true |
||||
tools: |
||||
supported: false |
||||
reasoning_effort: |
||||
supported: false |
||||
- id: sonar-pro |
||||
name: Sonar Pro |
||||
description: Perplexity AI model for complex queries |
||||
context: 200000 |
||||
abilities: |
||||
temperature: |
||||
supported: true |
||||
vision: |
||||
supported: true |
||||
system_message: |
||||
supported: true |
||||
# provider with multiple api keys |
||||
- id: my_provider |
||||
name: My Provider |
||||
base_url: http://localhost:4000 |
||||
api_keys: |
||||
openai: OPENAI_KEY |
||||
anthropic: ANTHROPIC_KEY |
||||
models: |
||||
- id: gpt-4o |
||||
name: "GPT-4o" |
||||
context: 200000 |
||||
provider: openai # matches "openai" in api_keys |
||||
abilities: |
||||
temperature: |
||||
supported: true |
||||
vision: |
||||
supported: true |
||||
system_message: |
||||
supported: true |
||||
tools: |
||||
supported: true |
||||
- id: claude-sonnet-4 |
||||
name: "Claude Sonnet 4" |
||||
context: 200000 |
||||
provider: anthropic # matches "anthropic" in api_keys |
||||
abilities: |
||||
temperature: |
||||
supported: true |
||||
vision: |
||||
supported: true |
||||
system_message: |
||||
supported: true |
||||
tools: |
||||
supported: true |
||||
- id: litellm |
||||
name: LiteLLM |
||||
base_url: http://localhost:4000 |
||||
# No `api_keys` - authentication is provided by the LiteLLM config |
||||
models: |
||||
- id: anthropic/claude-sonnet-4-20250514 |
||||
name: "Claude Sonnet 4" |
||||
context: 200000 |
||||
abilities: |
||||
temperature: |
||||
supported: true |
||||
vision: |
||||
supported: true |
||||
system_message: |
||||
supported: true |
||||
tools: |
||||
supported: true |
||||
|
||||
@ -0,0 +1,20 @@ |
||||
providers: |
||||
- id: vllm |
||||
name: vLLM Instance |
||||
base_url: https://lasseedfast.se/vllm |
||||
    api_keys:
      # NOTE(review): plaintext API key committed to the repository — rotate
      # this key and load it from an environment variable or secret store.
      vllm: "ap98sfoiuajcnwe89sozchnsw9oeacislh"
||||
models: |
||||
- id: "gpt-oss:20b" |
||||
name: "GPT OSS 20B (Main)" |
||||
provider: vllm |
||||
context: 16000 |
||||
abilities: |
||||
temperature: |
||||
supported: true |
||||
vision: |
||||
supported: false |
||||
system_message: |
||||
supported: true |
||||
tools: |
||||
supported: true |
||||
@ -1,182 +0,0 @@ |
||||
#!/usr/bin/env python3 |
||||
""" |
||||
Convert stored embeddings to plain Python lists for an existing Chroma collection. |
||||
|
||||
Usage: |
||||
# Dry run (inspect first 50 ids) |
||||
python scripts/convert_embeddings_to_lists.py --collection talks --limit 50 --dry-run |
||||
|
||||
# Full run (no dry run) |
||||
python scripts/convert_embeddings_to_lists.py --collection talks |
||||
|
||||
Notes: |
||||
- Run from your project root (same env you use to access chroma_db). |
||||
- Back up chromadb_data before running. |
||||
""" |
||||
import argparse |
||||
import json |
||||
import os |
||||
import time |
||||
from pathlib import Path |
||||
from typing import List |
||||
import math |
||||
import sys |
||||
|
||||
# Use the same imports/bootstrapping as you already have in your project |
||||
# so the same chroma client and embedding function are loaded. |
||||
# Adjust the import path if necessary. |
||||
os.chdir("/home/lasse/riksdagen") |
||||
sys.path.append("/home/lasse/riksdagen") |
||||
|
||||
import numpy as np |
||||
from _chromadb.chroma_client import chroma_db |
||||
|
||||
CHECKPOINT_DIR = Path("var/chroma_repair") |
||||
CHECKPOINT_DIR.mkdir(parents=True, exist_ok=True) |
||||
|
||||
def normalize_embedding(emb):
    """
    Convert a single embedding to a plain Python list[float].

    Accepts numpy arrays, objects exposing tolist(), plain lists, and any
    other iterable of numbers.
    """
    # Fast path: numpy arrays convert directly.
    if isinstance(emb, np.ndarray):
        return emb.tolist()
    # Other array-likes (pandas etc.) may expose tolist() as well.
    if not isinstance(emb, list) and hasattr(emb, "tolist"):
        try:
            return emb.tolist()
        except Exception:
            pass
    # Already a list of numbers: coerce each element to float.
    if isinstance(emb, list):
        return [float(value) for value in emb]
    # Last resort: treat it as a generic iterable.
    try:
        return [float(value) for value in emb]
    except Exception:
        raise ValueError("Cannot normalize embedding of type: %s" % type(emb))
||||
|
||||
def chunked_iter(iterable, n):
    """Yield successive lists of at most *n* items from *iterable*."""
    pending = []
    for item in iterable:
        pending.append(item)
        if len(pending) == n:
            yield pending
            pending = []
    # Flush the final, possibly short, chunk.
    if pending:
        yield pending
||||
|
||||
def load_checkpoint(name):
    """
    Load checkpoint state for *name* from CHECKPOINT_DIR.

    Returns:
        dict: Previously saved progress state, or a fresh default when no
        checkpoint file exists yet.
    """
    path = CHECKPOINT_DIR / f"{name}.json"
    if path.exists():
        # BUG FIX: json.load() expects a file object, not a Path — the
        # original `json.load(path)` raised AttributeError at runtime.
        with open(path) as handle:
            return json.load(handle)
    return {"last_index": 0, "processed_ids": []}
||||
|
||||
def save_checkpoint(name, data):
    """Persist checkpoint state for *name* as JSON in CHECKPOINT_DIR."""
    target = CHECKPOINT_DIR / f"{name}.json"
    target.write_text(json.dumps(data))
||||
|
||||
def main():
    """
    CLI entry point: normalize every stored embedding in a Chroma collection
    to a plain Python list, processing ids in resumable batches with a JSON
    checkpoint on disk.

    Flags:
        --collection       (required) Chroma collection name
        --batch            batch size per update call
        --dry-run          report only, write nothing
        --limit            cap on total ids processed (testing)
        --checkpoint-name  checkpoint file name (defaults to collection)
    """
    parser = argparse.ArgumentParser()
    parser.add_argument("--collection", required=True, help="Chroma collection name (e.g. talks)")
    parser.add_argument("--batch", type=int, default=1000, help="Batch size for update (default 1000)")
    parser.add_argument("--dry-run", action="store_true", help="Dry run: don't write updates, just report")
    parser.add_argument("--limit", type=int, default=None, help="Limit total number of ids to process (for testing)")
    parser.add_argument("--checkpoint-name", default=None, help="Name for checkpoint file (defaults to collection name)")
    args = parser.parse_args()

    coll_name = args.collection
    checkpoint_name = args.checkpoint_name or coll_name

    print(f"Connecting to Chroma collection '{coll_name}'...")
    col = chroma_db.get_collection(coll_name)

    # Get the full list of ids. For 600k this should be okay to hold in memory,
    # but if you need a more streaming approach, tell me and I can adapt.
    all_info = col.get(include=[])  # may return {'ids': [...]} as in your env
    ids = list(all_info.get("ids", []))
    total_ids = len(ids)
    if args.limit:
        ids = ids[: args.limit]
        total_process = len(ids)
    else:
        total_process = total_ids

    print(f"Found {total_ids} ids in collection; will process {total_process} ids (limit={args.limit})")

    # load checkpoint so an interrupted run resumes where it stopped
    ck = load_checkpoint(checkpoint_name)
    start_index = ck.get("last_index", 0)
    print(f"Resuming at index {start_index}")

    # iterate in batches starting from last_index
    processed = 0
    for i in range(start_index, total_process, args.batch):
        batch_ids = ids[i : i + args.batch]
        print(f"\nProcessing batch {i}..{i+len(batch_ids)-1} (count={len(batch_ids)})")

        # fetch full info for this batch (documents, metadatas, embeddings)
        # we only need embeddings for this repair, but include docs/meta for verification if you want
        try:
            items = col.get(ids=batch_ids, include=["embeddings", "documents", "metadatas"])
        except Exception as e:
            print("Error fetching batch:", e)
            # do a small retry after sleep
            time.sleep(2)
            items = col.get(ids=batch_ids, include=["embeddings", "documents", "metadatas"])

        batch_embeddings = items.get("embeddings", [])
        # items.get("ids") should match batch_ids order; if not, align by ids
        ids_from_get = items.get("ids", batch_ids)
        if len(ids_from_get) != len(batch_ids):
            print("Warning: length mismatch between requested ids and returned ids")

        # Normalize embeddings; abort the batch on the first failure so we
        # never write a partially converted batch back.
        normalized_embeddings = []
        failed = False
        for idx, emb in enumerate(batch_embeddings):
            try:
                norm = normalize_embedding(emb)
            except Exception as e:
                print(f"Failed to normalize embedding for id {ids_from_get[idx]}: {e}")
                failed = True
                break
            normalized_embeddings.append(norm)

        if failed:
            print("Skipping this batch due to failures. You can adjust batch size and retry.")
            break

        # Dry-run: just print stats and continue
        if args.dry_run:
            # show a sample
            sample_i = min(3, len(normalized_embeddings))
            print("Sample normalized embedding lengths:", [len(normalized_embeddings[k]) for k in range(sample_i)])
            # Optionally inspect first few floats
            print("Sample values (first 6 floats):", [normalized_embeddings[k][:6] for k in range(sample_i)])
        else:
            # Update the collection in place (update will upsert embeddings for given ids)
            try:
                col.update(ids=ids_from_get, embeddings=normalized_embeddings)
            except Exception as e:
                print("Update failed, retrying once after short sleep:", e)
                time.sleep(2)
                col.update(ids=ids_from_get, embeddings=normalized_embeddings)

            print(f"Updated {len(normalized_embeddings)} embeddings in collection '{coll_name}'")

        # checkpoint progress (even in dry-run, so resume behaves the same)
        ck["last_index"] = i + len(batch_ids)
        save_checkpoint(checkpoint_name, ck)
        processed += len(batch_ids)

    print(f"\nDone. Processed {processed} ids. Checkpoint saved to {CHECKPOINT_DIR / (checkpoint_name + '.json')}")
    print("Reminder: run a few queries to validate search quality.")
||||
|
||||
if __name__ == "__main__": |
||||
main() |
||||
@ -0,0 +1,25 @@ |
||||
from arango_client import arango

# One-off migration: chunk documents written by the old ChromaDB pipeline
# lack parent_id and carry legacy Chroma fields. Re-link them to their
# parent talk and drop the obsolete fields.
chunks_collection = arango.db.collection("chunks")

q = """
FOR chunk IN chunks
    FILTER chunk.parent_id == null
    RETURN chunk
"""

cursor = arango.db.aql.execute(q, batch_size=1000, count=True, ttl=360)
updated_docs = []
n = 0
for doc in cursor:
    n += 1
    doc['collection'] = 'talks'
    # FIX: use pop() with a default — `del` raised KeyError for documents
    # that never had the legacy fields. ("chroma_collecton" is the actual,
    # misspelled field name used when these docs were written.)
    doc.pop('chroma_collecton', None)
    doc.pop('chroma_id', None)
    # The chunk key is "{talk_key}:{index}"; the part before ":" is the talk.
    doc['parent_id'] = f"talks/{doc['_key'].split(':')[0]}"
    updated_docs.append(doc)
    if len(updated_docs) >= 100:
        chunks_collection.update_many(updated_docs, merge=False, silent=True)
        updated_docs = []
        print(f"Updated {n} documents", end="\r")
# FIX: only flush the final partial batch when it is non-empty.
if updated_docs:
    chunks_collection.update_many(updated_docs, merge=False, silent=True)
||||
@ -0,0 +1,173 @@ |
||||
import os |
||||
import sys |
||||
import logging |
||||
|
||||
# Silence the per-request HTTP logs from the ollama/httpx library |
||||
logging.getLogger("httpx").setLevel(logging.WARNING) |
||||
|
||||
os.chdir("/home/lasse/riksdagen") |
||||
sys.path.append("/home/lasse/riksdagen") |
||||
|
||||
from arango_client import arango |
||||
from ollama import Client as Ollama |
||||
from arango.collection import Collection |
||||
from concurrent.futures import ThreadPoolExecutor, as_completed |
||||
from typing import List, Dict |
||||
from time import sleep |
||||
from utils import TextChunker |
||||
|
||||
|
||||
def make_embeddings(texts: List[str]) -> List[List[float]]:
    """
    Generate embeddings for a list of texts using Ollama.

    Args:
        texts (List[str]): Text strings to embed.

    Returns:
        List[List[float]]: One embedding vector per input text.
    """
    client = Ollama(host='192.168.1.12:33405')
    response = client.embed(
        model="qwen3-embedding:latest",
        input=texts,
        dimensions=384,
    )
    return response.embeddings
||||
|
||||
|
||||
def process_chunk_batch(chunk_batch: List[Dict]) -> List[Dict]:
    """
    Generate embeddings for a batch of chunks and attach them in place.

    Args:
        chunk_batch (List[Dict]): Chunk dicts, each with a 'text' field.

    Returns:
        List[Dict]: The same list, with an 'embedding' field added to each dict.
    """
    # Brief pause to avoid hammering the embedding server when many worker
    # threads fire at once.
    sleep(1)
    vectors = make_embeddings([chunk['text'] for chunk in chunk_batch])
    for chunk, vector in zip(chunk_batch, vectors):
        chunk['embedding'] = vector
    return chunk_batch
||||
|
||||
|
||||
def make_arango_embeddings() -> int:
    """
    Chunks and embeds all talks that are not yet represented in the 'chunks' collection.

    For each talk that has no chunks in the collection yet:
    - If the talk document already has a 'chunks' field (legacy path), those are used.
    - Otherwise the speech text is split into chunks using TextChunker.
    Embedding vectors are generated via Ollama and stored in the 'chunks' collection.

    Each chunk document in ArangoDB has:
        _key      : "{talk_key}:{chunk_index}" (unique within the collection)
        text      : the chunk text
        index     : chunk index within the talk
        parent_id : "talks/{talk_key}" (links back to the source talk)
        collection: "talks"
        embedding : the vector (list of floats)

    Returns:
        int: Total number of chunk documents inserted/updated.
    """
    if not arango.db.has_collection("chunks"):
        chunks_collection: Collection = arango.db.create_collection("chunks")
    else:
        chunks_collection: Collection = arango.db.collection("chunks")

    # Find every talk that has no entry yet in the chunks collection.
    # The inner FOR loop returns [] if no match exists (acts as NOT EXISTS).
    cursor = arango.db.aql.execute(
        """
        FOR p IN talks
            FILTER p.anforandetext != null AND p.anforandetext != ""
            FILTER (
                FOR c IN chunks
                    FILTER c.parent_id == p._id
                    LIMIT 1
                    RETURN 1
            ) == []
            RETURN {
                _key: p._key,
                _id: p._id,
                anforandetext: p.anforandetext,
                chunks: p.chunks
            }
        """,
        batch_size=1000,
        ttl=360,
    )

    n = 0
    embed_batch_size = 20  # Number of chunks per Ollama call
    chunk_batches: List[List[Dict]] = []
    # PERF FIX: the chunker was previously constructed once per talk inside
    # the loop; it is loop-invariant, so create it a single time up front.
    chunker = TextChunker(chunk_limit=500)

    for talk in cursor:
        talk_key = talk["_key"]
        parent_id = f"talks/{talk_key}"

        if talk.get("chunks"):
            # Legacy path: chunks were previously generated and stored on the
            # talk document. Strip out the old ChromaDB-specific fields and
            # assign a proper _key.
            _chunks = []
            for chunk in talk["chunks"]:
                idx = chunk.get("index", 0)
                _chunks.append({
                    "_key": f"{talk_key}:{idx}",
                    "text": chunk["text"],
                    "index": idx,
                    "parent_id": parent_id,
                    "collection": "talks",
                })
        else:
            # New path: chunk the speech text directly with TextChunker.
            text = (talk.get("anforandetext") or "").strip()
            text_chunks = chunker.chunk(text)
            _chunks = [
                {
                    "_key": f"{talk_key}:{idx}",
                    "text": content,
                    "index": idx,
                    "parent_id": parent_id,
                    "collection": "talks",
                }
                for idx, content in enumerate(text_chunks)
                if content and content.strip()
            ]

        # Split into batches for embedding
        for i in range(0, len(_chunks), embed_batch_size):
            batch = _chunks[i : i + embed_batch_size]
            if batch:
                chunk_batches.append(batch)

    # Embed all batches in parallel (Ollama calls are I/O-bound, threads are fine)
    total_batches = len(chunk_batches)
    completed_batches = 0
    with ThreadPoolExecutor(max_workers=3) as executor:
        futures = [executor.submit(process_chunk_batch, batch) for batch in chunk_batches]
        processed_chunks: List[Dict] = []
        for future in as_completed(futures):
            result = future.result()
            completed_batches += 1
            processed_chunks.extend(result)
            print(f"Embedding batches: {completed_batches}/{total_batches} | chunks ready to insert: {len(processed_chunks)}", end="\r")
            # Insert in batches of 100 to keep HTTP payloads small
            if len(processed_chunks) >= 100:
                n += len(processed_chunks)
                chunks_collection.insert_many(processed_chunks, overwrite=True)
                processed_chunks = []
        if processed_chunks:
            n += len(processed_chunks)
            chunks_collection.insert_many(processed_chunks, overwrite=True)

    print(f"\nDone. Inserted/updated {n} chunks in ArangoDB.")
    return n
||||
|
||||
|
||||
if __name__ == "__main__": |
||||
make_arango_embeddings() |
||||
@ -0,0 +1,5 @@ |
||||
### Inlogg riksdagsgruppen från Fojo-hackathon |
||||
https://arango.lasseedfast.se |
||||
riksdagsgruppen |
||||
popre4-cygcuz-viHjyc |
||||
|
||||
@ -0,0 +1,177 @@ |
||||
""" |
||||
Synkroniserar nya anföranden från riksdagen.se till databasen och processar dem. |
||||
|
||||
Pipeline (körs dagligen via systemd timer): |
||||
1. Ladda ned årets anföranden från riksdagen.se (ersätter tidigare nerladdning) |
||||
2. Infoga nya anföranden i ArangoDB (hoppar över redan existerande) |
||||
3. Tilldela debatt-ID:n till anföranden som saknar det |
||||
4. Bygg embeddings för datum som saknar chunks |
||||
5. Generera sammanfattningar för datum som saknar summary |
||||
|
||||
Kör manuellt: python scripts/sync_talks.py |
||||
""" |
||||
|
||||
import os |
||||
import sys |
||||
import logging |
||||
from datetime import datetime |
||||
from io import BytesIO |
||||
from urllib.request import urlopen |
||||
from zipfile import ZipFile |
||||
|
||||
# Make sure we run from the project root so local modules can be found.
os.chdir("/home/lasse/riksdagen")
sys.path.append("/home/lasse/riksdagen")

logging.basicConfig(
    level=logging.INFO,
    format="%(asctime)s [%(levelname)s] %(message)s",
)
logger = logging.getLogger(__name__)

# System prompt used by the LLM when summarizing debates.
# NOTE: the prompt text is deliberately Swedish — summaries must be in Swedish.
SYSTEM_MESSAGE = """Din uppgift är att sammanfatta debatter i Sveriges riksdag.
Du kommer först att få enskilda tal som du ska sammanfatta var för sig, efter det ska du sammanfatta hela debatten.
Sammanfattningarna ska vara på svenska och vara koncisa och informativa.
Det är viktigt att du förstår vad som är kärnan i varje tal och debatt, fokusera därför på de argument och sakförhållanden som framförs.
"""
||||
|
||||
|
||||
def get_current_session_year() -> int:
    """
    Return the starting year of the current Riksdag session.

    Sessions run September-August, so:
        - January-August 2026    -> session started Sep 2025 -> returns 2025
        - September-December 2025 -> session started Sep 2025 -> returns 2025

    Returns:
        int: Four-digit starting year of the current session (e.g. 2025).
    """
    today = datetime.now()
    return today.year if today.month >= 9 else today.year - 1
||||
|
||||
|
||||
def download_current_year(session_year: int) -> str:
    """
    Download and extract the ZIP archive for the given Riksdag session,
    replacing any previously downloaded files for that year.

    The Riksdag keeps updating the same ZIP file during an ongoing session,
    so we must re-download it every run to pick up new speeches.

    Args:
        session_year (int): Starting year of the session (e.g. 2025 for 2025/26).

    Returns:
        str: Path to the directory the files were extracted into.
    """
    suffix = str(session_year + 1)[2:]  # e.g. "26" for 2026
    archive_name = f"anforande-{session_year}{suffix}"
    url = f"https://data.riksdagen.se/dataset/anforande/{archive_name}.json.zip"
    dir_path = os.path.join("talks", archive_name)

    logger.info(f"Downloading {url} → {dir_path}")
    os.makedirs(dir_path, exist_ok=True)

    # Wipe old files so we always work from a fresh copy.
    for filename in os.listdir(dir_path):
        os.remove(os.path.join(dir_path, filename))

    with urlopen(url) as resp:
        with ZipFile(BytesIO(resp.read())) as zf:
            zf.extractall(dir_path)

    count = len(os.listdir(dir_path))
    logger.info(f"Extracted {count} files to {dir_path}")
    return dir_path
||||
|
||||
|
||||
def get_unsummarized_dates() -> list[str]:
    """
    Fetch dates from ArangoDB that have speeches without a summary.

    Returns:
        list[str]: Sorted date strings, e.g. ["2026-02-10", "2026-02-11"].
    """
    # Imported lazily so merely importing this module does not open a
    # database connection.
    from arango_client import arango

    cursor = arango.db.aql.execute(
        """
        FOR doc IN talks
            FILTER doc.summary == null
            RETURN DISTINCT doc.datum
        """,
        ttl=300,
    )
    dates = sorted(cursor)
    logger.info(f"Found {len(dates)} dates with unsummarized talks")
    return dates
||||
|
||||
|
||||
def sync() -> None:
    """
    Run the full sync pipeline:
        1. Download this session's speeches
        2. Insert new speeches into ArangoDB
        3. Assign debate IDs
        4. Build embeddings for new dates
        5. Generate summaries for new dates
    """
    logger.info("=== Starting daily riksdagen sync ===")

    # --- Stage 1: Download ---
    session_year = get_current_session_year()
    logger.info(f"Current session year: {session_year}/{session_year + 1}")
    dir_path = download_current_year(session_year)

    # --- Stage 2: Insert new speeches into ArangoDB ---
    # update_folder() fetches all existing _keys from the database and skips
    # them, so only new speeches are inserted.
    logger.info("Stage 2: Inserting new talks into ArangoDB...")
    from scripts.documents_to_arango import update_folder

    new_talks = update_folder(os.path.abspath(dir_path))
    logger.info(f"Stage 2 complete: {new_talks} new talks inserted")

    # --- Stage 3: Assign debate IDs ---
    # Speeches missing the 'debate' field are grouped into debates based on
    # date and on whether they are replies or not.
    logger.info("Stage 3: Assigning debate IDs to talks missing them...")
    from scripts.debates import make_debate_ids

    make_debate_ids()
    logger.info("Stage 3 complete")

    # --- Stage 4: Chunk + build embeddings in ArangoDB ---
    # make_arango_embeddings() finds all speeches lacking chunks in the
    # 'chunks' collection, chunks the text, generates vectors via Ollama
    # and stores everything directly in ArangoDB. ChromaDB is not used.
    logger.info("Stage 4: Chunking and embedding new talks into ArangoDB...")
    from scripts.make_arango_embeddings import make_arango_embeddings

    total_chunks = make_arango_embeddings()
    logger.info(f"Stage 4 complete: {total_chunks} chunks created")

    # --- Stage 5: Generate summaries ---
    # process_debate_date() automatically skips speeches that already have a
    # summary, so it is safe to run repeatedly.
    new_dates = get_unsummarized_dates()
    if new_dates:
        logger.info(f"Stage 5: Generating summaries for {len(new_dates)} dates...")
        from scripts.debates import process_debate_date

        for date in new_dates:
            process_debate_date(date, SYSTEM_MESSAGE)
        logger.info(f"Stage 5 complete: summaries generated for {len(new_dates)} dates")
    else:
        logger.info("Stage 5: No unsummarized dates, skipping")

    logger.info("=== Sync complete ===")
||||
|
||||
|
||||
if __name__ == "__main__":
    # Run the full daily sync pipeline when executed as a script.
    sync()
||||
@ -0,0 +1,57 @@ |
||||
from arango_client import arango |
||||
from scripts.make_arango_embeddings import process_chunk_batch |
||||
from arango.collection import Collection |
||||
from typing import List, Dict |
||||
|
||||
def test_full_make_arango_embeddings_for_one_talk() -> None:
    """
    Integration test for the full make_arango_embeddings chain:
    - Fetches a specific talk document from ArangoDB.
    - Processes its chunks to generate embeddings.
    - Inserts/updates those chunks in the 'chunks' collection.
    - Verifies that the chunks were updated in ArangoDB.

    This test requires ArangoDB and Ollama to be running and accessible.
    """
    # The _id of the talk we want to process
    target_id: str = "talks/000004cc-b896-e611-9441-00262d0d7125"

    # Get the talks and chunks collections
    talks_collection: Collection = arango.db.collection("talks")
    chunks_collection: Collection = arango.db.collection("chunks")

    # Fetch the talk document
    talk: Dict = talks_collection.get(target_id)
    assert talk is not None, f"Talk with _id {target_id} not found"
    assert "chunks" in talk and talk["chunks"], "Talk has no chunks"

    # Prepare chunks for embedding
    processed_chunks: List[Dict] = []
    for chunk in talk["chunks"]:
        key: str = chunk["chroma_id"].split("/")[-1]
        chunk["_key"] = key.split(":")[-1]
        chunk["parent_id"] = target_id
        chunk["collection"] = "talks"
        # Drop legacy ChromaDB fields not needed for embedding.
        # NOTE: 'chroma_collecton' (sic) matches the misspelled key as it
        # appears in the stored documents — do not "fix" the spelling here.
        chunk.pop("chroma_id", None)
        chunk.pop("chroma_collecton", None)
        processed_chunks.append(chunk)

    # Generate embeddings for all chunks
    processed_chunks = process_chunk_batch(processed_chunks)

    # Insert/update chunks in the 'chunks' collection
    chunks_collection.insert_many(processed_chunks, overwrite=True)

    # Verify that the chunks were updated in ArangoDB
    for chunk in processed_chunks:
        db_chunk = chunks_collection.get(chunk["_key"])
        # Fixed: report the key of the chunk being checked, not the
        # talk-level key as before.
        assert db_chunk is not None, f"Chunk {chunk['_key']} not found in DB"
        assert "embedding" in db_chunk, "Chunk missing embedding in DB"
        assert isinstance(db_chunk["embedding"], list), "Embedding is not a list"
        print(f"Chunk {chunk['_key']} updated with embedding of length {len(db_chunk['embedding'])}")
||||
|
||||
if __name__ == "__main__":
    # Allow running this integration test directly as a script. Under
    # pytest the function is collected by name instead; guarding the call
    # means importing this module no longer triggers a live ArangoDB/Ollama
    # round-trip at import/collection time.
    test_full_make_arango_embeddings_for_one_talk()
||||
Loading…
Reference in new issue