From fb4a1bc702c5482f6c974949171e46202ea3a146 Mon Sep 17 00:00:00 2001
From: Lars <Lars@stommer.de>
Date: Wed, 3 Sep 2025 07:56:45 +0200
Subject: [PATCH] =?UTF-8?q?app/core/embed.py=20hinzugef=C3=BCgt?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 app/core/embed.py | 42 ++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 42 insertions(+)
 create mode 100644 app/core/embed.py

diff --git a/app/core/embed.py b/app/core/embed.py
new file mode 100644
index 0000000..83714b6
--- /dev/null
+++ b/app/core/embed.py
@@ -0,0 +1,42 @@
+from __future__ import annotations
+import os, time, json
+import urllib.request
+from typing import List, Dict, Any
+
+EMBED_URL = os.getenv("EMBED_URL", "http://127.0.0.1:8990/embed")
+EMBED_MODEL = os.getenv("EMBED_MODEL", "minilm-384")
+EMBED_BATCH = int(os.getenv("EMBED_BATCH", "64"))
+TIMEOUT = 60
+
+class EmbedError(RuntimeError): ...
+
+def _post_json(url: str, payload: Dict[str, Any]) -> Dict[str, Any]:
+    data = json.dumps(payload).encode("utf-8")
+    req = urllib.request.Request(url, data=data, headers={"Content-Type": "application/json"})
+    with urllib.request.urlopen(req, timeout=TIMEOUT) as resp:
+        return json.loads(resp.read().decode("utf-8"))
+
+def embed_texts(texts: List[str], model: str | None = None, batch_size: int | None = None) -> List[List[float]]:
+    model = model or EMBED_MODEL
+    batch = batch_size or EMBED_BATCH
+    out: List[List[float]] = []
+    i = 0
+    while i < len(texts):
+        chunk = texts[i:i+batch]
+        # einfache Retries bei 429/500er
+        for attempt in range(5):
+            try:
+                resp = _post_json(EMBED_URL, {"model": model, "inputs": chunk})
+                vecs = resp.get("embeddings") or resp.get("vectors") or resp.get("data")
+                if not isinstance(vecs, list): raise EmbedError(f"Bad embed response keys: {resp.keys()}")
+                out.extend(vecs)
+                break
+            except Exception as e:
+                if attempt == 4: raise
+                time.sleep(1.5 * (attempt + 1))
+                continue
+        i += batch
+    return out
+
+def embed_one(text: str, model: str | None = None) -> List[float]:
+    return embed_texts([text], model=model, batch_size=1)[0]