working on ingestion

2026-02-19 11:54:31 +01:00 · 2026-02-19 11:54:31 +01:00 · 51488b3ee6
parent 1a77b84921
commit 51488b3ee6
6 changed files with 856 additions and 54 deletions
--- a/Docker/docker-compose.yaml
+++ b/Docker/docker-compose.yaml
@ -14,6 +14,7 @@ services:
      LANGFUSE_PUBLIC_KEY: ${LANGFUSE_PUBLIC_KEY}
      LANGFUSE_SECRET_KEY: ${LANGFUSE_SECRET_KEY}
      ELASTICSEARCH_INDEX: ${ELASTICSEARCH_INDEX}
+      OLLAMA_MODEL_NAME: ${OLLAMA_MODEL_NAME}
    
    extra_hosts:
      - "host.docker.internal:host-gateway"
--- a/Docker/src/server.py
+++ b/Docker/src/server.py
@ -19,14 +19,14 @@ class BrunixEngine(brunix_pb2_grpc.AssistanceEngineServicer):
    def __init__(self):

        self.base_url = os.getenv("LLM_BASE_URL", "http://ollama-light-service:11434")
-        self.model_name = os.getenv("LLM_MODEL", "qwen2.5:1.5b")
+        self.model_name = os.getenv("OLLAMA_MODEL_NAME")

        logger.info(f"Starting server")

        self.llm = Ollama(base_url=self.base_url, model=self.model_name)

        self.embeddings = OllamaEmbeddings(
-            base_url=self.base_url, model="qwen3-embedding:0.6b"
+            base_url=self.base_url, model=self.model_name
        )

        es_url = os.getenv("ELASTICSEARCH_URL", "http://elasticsearch:9200")
@ -40,7 +40,7 @@ class BrunixEngine(brunix_pb2_grpc.AssistanceEngineServicer):
            vector_query_field="embedding",
        )

-    def format_context(docs) -> str:
+    def format_context(self, docs) -> str:
        parts = []
        for i, d in enumerate(docs, start=1):
            meta = d.metadata or {}
@ -76,11 +76,9 @@ class BrunixEngine(brunix_pb2_grpc.AssistanceEngineServicer):

            chain = prompt | self.llm

-            for chunk in chain.stream(
-                {"context": context_text, "question": request.query}
-            ):
+            result = chain.invoke({"context": context_text, "question": request.query})
            yield brunix_pb2.AgentResponse(
-                    text=str(chunk), avap_code="AVAP-2026", is_final=False
+                text=str(result), avap_code="AVAP-2026", is_final=True
            )

            yield brunix_pb2.AgentResponse(text="", avap_code="", is_final=True)
--- a/7
+++ b/7
@ -20,3 +20,10 @@ compose_up:
 	sleep 2
 	docker compose -f Docker/docker-compose.yaml --env-file .env up -d --build
 	@echo "✓ Done!"
+
+# Kill all kubectl port-forward tunnels
+.PHONY: tunnels_down
+tunnels_down:
+	@echo "Killing all kubectl port-forward tunnels..."
+	-pkill -f 'kubectl port-forward' || true
+	@echo "✓ All tunnels killed!"
--- a/scratches/pseco/ingestion/n00
+++ b/scratches/pseco/ingestion/n00
--- a/scratches/pseco/ingestion/n00
+++ b/scratches/pseco/ingestion/n00
--- a/scratches/pseco/ingestion/n00
+++ b/scratches/pseco/ingestion/n00
@ -0,0 +1,153 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "9949107c",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'http://host.docker.internal:11434'"
+      ]
+     },
+     "execution_count": 1,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from langchain_community.embeddings import OllamaEmbeddings\n",
+    "import os\n",
+    "from langchain_community.llms import Ollama\n",
+    "\n",
+    "os.getenv(\"LLM_BASE_URL\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 25,
+   "id": "458fd5c2",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "embeddings = OllamaEmbeddings(\n",
+    "    base_url=\"http://localhost:11434\", model=\"qwen2.5:1.5b\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 26,
+   "id": "679cbf21",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "v = embeddings.embed_documents([\"hello world\", \"goodbye world\"])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 16,
+   "id": "ee9afd0c",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "list"
+      ]
+     },
+     "execution_count": 16,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "type(v)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 18,
+   "id": "5f85dc6f",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "1536"
+      ]
+     },
+     "execution_count": 18,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "len(v[0])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "id": "1e8b8ecd",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/tmp/ipykernel_34744/3454453355.py:1: LangChainDeprecationWarning: The class `Ollama` was deprecated in LangChain 0.3.1 and will be removed in 1.0.0. An updated version of the class exists in the `langchain-ollama package and should be used instead. To use it run `pip install -U `langchain-ollama` and import as `from `langchain_ollama import OllamaLLM``.\n",
+      "  llm = Ollama(base_url=\"http://localhost:11434\", model=\"qwen2.5:1.5b\")\n"
+     ]
+    }
+   ],
+   "source": [
+    "llm = Ollama(base_url=\"http://localhost:11434\", model=\"qwen2.5:1.5b\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "1db5f6e3",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Princilandia does not actually exist as a country or city on Earth. The term \"Princilandia\" appears to be made up or fictional and doesn't correspond to any real geographical location with an official capital.\n",
+      "\n",
+      "The correct answer would depend on which imaginary world you're referring to, but without that context, I can't provide the specific name of the capital for Princilandia. If you're interested in information about a country known as \"Princelandia\" or have another question about such places, please feel free to ask and I'd be happy to help!\n"
+     ]
+    }
+   ],
+   "source": [
+    "response = llm.invoke(\"\")\n",
+    "print(response)"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "assistance-engine",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.12.11"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}