types angepasst

2025-12-12 13:19:28 +01:00 · 2025-12-12 13:19:28 +01:00 · 1e3fcc1633
commit 1e3fcc1633
parent 0d28a6c1a7
1 changed file with 97 additions and 135 deletions
--- a/config/types.yaml
+++ b/config/types.yaml
@@ -1,198 +1,160 @@
-version: 1.4 # Merge WP-15 (Smart Edges) & WP-07 (Schemas)
+version: 1.6 # Balance zwischen Speed, Kontext und Smartness

 # ==============================================================================
-# 1. CHUNKING PROFILES (WP-15 Smart Edge Allocation)
+# 1. CHUNKING PROFILES
 # ==============================================================================
-# Diese Profile steuern, wie Texte zerlegt und ob sie semantisch angereichert werden.

 chunking_profiles:
  
-  # A. Standard / Schnell (für einfache Quellen, Logs)
-  # - Strategie: Sliding Window
-  # - LLM-Filter: AUS (spart Kosten/Zeit)
+  # A. SHORT & FAST (Für atomare Schnipsel)
+  # Einsatz: Glossar, Tasks, Risiken
+  # Vorteil: Präzise Treffer für kurze Infos.
  sliding_short:
    strategy: sliding_window
-    enable_smart_edge_allocation: false 
+    enable_smart_edge_allocation: false # AUS (Speed)
    target: 200
    max: 350
    overlap: [30, 50]

-  # B. Smart Flow (für Konzepte, Journal, Projekte)
-  # - Strategie: Sliding Window (für flüssigen Text)
-  # - LLM-Filter: AN (verteilt Kanten intelligent auf Absätze)
+  # B. STANDARD & FAST (Der neue "Mittelweg")
+  # Einsatz: Quellen, Journal, Daily Logs
+  # Vorteil: Viel Kontext für RAG, aber rasend schneller Import ohne LLM.
+  sliding_standard:
+    strategy: sliding_window
+    enable_smart_edge_allocation: false # AUS (Speed)
+    target: 450  # Größerer Kontext!
+    max: 650
+    overlap: [50, 100]
+
+  # C. SMART FLOW (Premium Chunking)
+  # Einsatz: Konzepte, Projekte, Erfahrungen
+  # Vorteil: LLM prüft Inhalt und verlinkt präzise. Kostet Zeit.
  sliding_smart_edges:
    strategy: sliding_window
-    enable_smart_edge_allocation: true
+    enable_smart_edge_allocation: true # AN (Intelligenz)
    target: 400
    max: 600
    overlap: [50, 80]

-  # C. Smart Structure (für Profile, Werte, Entscheidungen)
-  # - Strategie: By Heading (Harte Trennung an Überschriften)
-  # - LLM-Filter: AN (verteilt Kanten auf Sektionen)
+  # D. SMART STRUCTURE
+  # Einsatz: Profile, Werte, Prinzipien
+  # Vorteil: Respektiert die Markdown-Struktur (H2).
  structured_smart_edges:
    strategy: by_heading
-    enable_smart_edge_allocation: true
-    split_level: 2 # Trennt an H2 (##)
+    enable_smart_edge_allocation: true # AN (Intelligenz)
+    split_level: 2
    max: 600
    target: 400
-    overlap: [50, 80] # Fallback
+    overlap: [50, 80]

 # ==============================================================================
 # 2. DEFAULTS
 # ==============================================================================
 defaults:
  retriever_weight: 1.0
-  chunking_profile: sliding_smart_edges # Fallback: Immer smart versuchen
+  chunking_profile: sliding_standard # Fallback auf Standard (sicher & performant)
  edge_defaults: [] 

 # ==============================================================================
 # 3. TYPE DEFINITIONS
 # ==============================================================================
-# Hier werden Chunking, Retrieval-Gewichtung und GENERIERUNGS-SCHEMATA definiert.

 types:

-  # --- WISSENSBAUSTEINE ---
-
-  concept:
-    chunking_profile: sliding_smart_edges
-    retriever_weight: 0.60
-    edge_defaults: ["references", "related_to"]
-    schema: # WP-07: Anleitung für LLM zur Erstellung
-      - "Definition & Kernidee"
-      - "Kontext & Hintergrund"
-      - "Anwendungsbeispiele"
-      - "Verwandte Konzepte"
+  # --- MASSENDATEN (Speed + Kontext) ---

  source:
-    chunking_profile: sliding_short # Keine Smart Edges nötig (spart Ressourcen)
+    chunking_profile: sliding_standard # JETZT: Mehr Kontext (450 Token), trotzdem schnell
    retriever_weight: 0.50
    edge_defaults: [] 
    schema:
      - "Metadaten (Autor, URL, Datum)"
-      - "Zusammenfassung (Key Takeaways)"
-      - "Wichtige Zitate"
+      - "Zusammenfassung"
      - "Originaltext / Ausschnitte"

-  glossary:
-    chunking_profile: sliding_short
-    retriever_weight: 0.40
-    edge_defaults: ["related_to"]
-    schema:
-      - "Begriffserklärung"
-      - "Synonyme & Abgrenzung"
-
-  # --- IDENTITÄT & PERSÖNLICHKEIT ---
-
-  profile:
-    chunking_profile: structured_smart_edges # Struktur ist hier wichtig
-    retriever_weight: 0.70
+  journal:
+    chunking_profile: sliding_standard # JETZT: Mehr Kontext für Tagebucheinträge
+    retriever_weight: 0.80
    edge_defaults: ["references", "related_to"]
    schema:
-      - "Rolle & Beziehung"
-      - "Wichtige Fakten & Daten"
-      - "Gemeinsame Historie / Erfahrungen"
-      - "Präferenzen & Werte"
+      - "Tages-Log"
+      - "Erkenntnisse"
+      - "Entscheidungen"

-  value:
-    chunking_profile: structured_smart_edges
-    retriever_weight: 1.00 # Höchste Priorität für die Decision Engine
+  # --- ATOMARE DATEN (Speed + Präzision) ---
+
+  task:
+    chunking_profile: sliding_short # Kurz halten
+    retriever_weight: 0.80
+    edge_defaults: ["depends_on", "part_of"]
+    schema: ["Aufgabe", "Kontext", "DoD"]
+
+  glossary:
+    chunking_profile: sliding_short # Kurz halten
+    retriever_weight: 0.40
    edge_defaults: ["related_to"]
-    schema:
-      - "Definition des Wertes"
-      - "Warum ist das wichtig? (Motivation)"
-      - "Leitsätze für Entscheidungen"
-      - "Anti-Beispiele (Was wir vermeiden)"
-
-  principle:
-    chunking_profile: structured_smart_edges
-    retriever_weight: 0.95
-    edge_defaults: ["derived_from", "references"]
-    schema:
-      - "Das Prinzip (Kernsatz)"
-      - "Herleitung / Begründung"
-      - "Anwendung in der Praxis"
-
-  belief:
-    chunking_profile: sliding_short
-    retriever_weight: 0.90
-    edge_defaults: ["related_to"]
-    schema:
-      - "Glaubenssatz"
-      - "Ursprung (Woher kommt das?)"
-      - "Ist das noch hilfreich? (Reflexion)"
-
-  experience:
-    chunking_profile: sliding_smart_edges
-    retriever_weight: 0.90
-    edge_defaults: ["derived_from", "references"]
-    schema:
-      - "Situation (Was ist passiert?)"
-      - "Aktion (Was habe ich getan?)"
-      - "Ergebnis (Was war die Folge?)"
-      - "Learning (Was nehme ich mit?)"
-
-  # --- STRATEGIE & ENTSCHEIDUNG ---
-
-  goal:
-    chunking_profile: sliding_smart_edges
-    retriever_weight: 0.95
-    edge_defaults: ["depends_on", "related_to"]
-    schema:
-      - "Zielsetzung (SMART)"
-      - "Motivation (Warum?)"
-      - "Erfolgskriterien (KPIs)"
-      - "Meilensteine"
-
-  decision:
-    chunking_profile: structured_smart_edges 
-    retriever_weight: 1.00
-    edge_defaults: ["caused_by", "references"]
-    schema:
-      - "Kontext & Problemstellung"
-      - "Betrachtete Optionen (Pros/Cons)"
-      - "Die Entscheidung"
-      - "Begründung (Warum diese Wahl?)"
-      - "Erwartete Konsequenzen"
+    schema: ["Begriff", "Definition"]

  risk:
    chunking_profile: sliding_short
    retriever_weight: 0.85
    edge_defaults: ["related_to", "blocks"]
-    schema:
-      - "Risiko-Beschreibung"
-      - "Eintrittswahrscheinlichkeit & Impact"
-      - "Mitigations-Strategie (Plan B)"
+    schema: ["Beschreibung", "Mitigation"]

-  # --- OPERATIV ---
+  belief:
+    chunking_profile: sliding_short
+    retriever_weight: 0.90
+    edge_defaults: ["related_to"]
+    schema: ["Glaubenssatz", "Reflexion"]
+
+  # --- KERN-WISSEN (Smart Edges / LLM Active) ---
+
+  concept:
+    chunking_profile: sliding_smart_edges
+    retriever_weight: 0.60
+    edge_defaults: ["references", "related_to"]
+    schema:
+      - "Definition"
+      - "Kontext"
+      - "Verwandte Konzepte"

  project:
    chunking_profile: sliding_smart_edges
    retriever_weight: 0.97
    edge_defaults: ["references", "depends_on"] 
    schema:
-      - "Mission / Zielsetzung"
-      - "Aktueller Status"
-      - "Nächste Schritte (Next Actions)"
-      - "Offene Fragen / Blocker"
-      - "Referenzen (Links)"
+      - "Mission"
+      - "Status"
+      - "Next Actions"

-  task:
-    chunking_profile: sliding_short
-    retriever_weight: 0.80
-    edge_defaults: ["depends_on", "part_of"]
-    schema:
-      - "Aufgabe"
-      - "Kontext / Wichtigkeit"
-      - "Definition of Done"
-
-  journal:
+  experience:
    chunking_profile: sliding_smart_edges
-    retriever_weight: 0.80
+    retriever_weight: 0.90
+    edge_defaults: ["derived_from", "references"]
+    schema: ["Situation", "Aktion", "Ergebnis", "Learning"]
+
+  # --- STRUKTUR-DATEN (Smart Structure / LLM Active) ---
+
+  profile:
+    chunking_profile: structured_smart_edges
+    retriever_weight: 0.70
    edge_defaults: ["references", "related_to"]
-    schema:
-      - "Tages-Log / Ereignisse"
-      - "Erkenntnisse & Gedanken"
-      - "Entscheidungen des Tages"
-      - "Fokus für Morgen"
+    schema: ["Rolle", "Fakten", "Historie"]
+
+  value:
+    chunking_profile: structured_smart_edges
+    retriever_weight: 1.00
+    edge_defaults: ["related_to"]
+    schema: ["Definition", "Motivation", "Leitsätze"]
+
+  principle:
+    chunking_profile: structured_smart_edges
+    retriever_weight: 0.95
+    edge_defaults: ["derived_from", "references"]
+    schema: ["Prinzip", "Anwendung"]
+
+  decision:
+    chunking_profile: structured_smart_edges 
+    retriever_weight: 1.00
+    edge_defaults: ["caused_by", "references"]
+    schema: ["Problem", "Optionen", "Entscheidung", "Warum"]