WP15 #9
|
|
@@ -1,124 +1,198 @@
|
|||
version: 1.3 # Update für Smart Edge Allocation
|
||||
version: 1.4 # Merge WP-15 (Smart Edges) & WP-07 (Schemas)
|
||||
|
||||
# ==============================================================================
|
||||
# 1. CHUNKING PROFILES (WP-15 Smart Edge Allocation)
|
||||
# ==============================================================================
|
||||
# Diese Profile steuern, wie Texte zerlegt und ob sie semantisch angereichert werden.
|
||||
|
||||
# --- CHUNKING DEFINITIONEN ---
|
||||
# Hier definieren wir die technischen Strategien und den Smart Edge Filter.
|
||||
chunking_profiles:
|
||||
|
||||
# 1. Standard Profile (Sliding Window, KEIN LLM-Filter)
|
||||
# A. Standard / Schnell (für einfache Quellen, Logs)
|
||||
# - Strategie: Sliding Window
|
||||
# - LLM-Filter: AUS (spart Kosten/Zeit)
|
||||
sliding_short:
|
||||
strategy: sliding_window
|
||||
enable_smart_edge_allocation: false # Sekundärverfeinerung deaktiviert
|
||||
enable_smart_edge_allocation: false
|
||||
target: 200
|
||||
max: 350
|
||||
overlap: [30, 50]
|
||||
|
||||
# 2. Smart Edge Allocation Profile (Sliding Window + LLM-Filter)
|
||||
# B. Smart Flow (für Konzepte, Journal, Projekte)
|
||||
# - Strategie: Sliding Window (für flüssigen Text)
|
||||
# - LLM-Filter: AN (verteilt Kanten intelligent auf Absätze)
|
||||
sliding_smart_edges:
|
||||
strategy: sliding_window # Primärzerlegung: Sliding Window
|
||||
enable_smart_edge_allocation: true # SEKUNDÄRVERFEINERUNG: LLM-Filter aktiv
|
||||
strategy: sliding_window
|
||||
enable_smart_edge_allocation: true
|
||||
target: 400
|
||||
max: 600
|
||||
overlap: [50, 80]
|
||||
|
||||
# 3. Strukturierte Profile (By Heading, KEIN LLM-Filter)
|
||||
structured_strict:
|
||||
strategy: by_heading
|
||||
enable_smart_edge_allocation: false
|
||||
split_level: 2
|
||||
max: 600
|
||||
target: 400
|
||||
overlap: [50, 80]
|
||||
|
||||
# 4. Strukturierte Profile (By Heading + LLM-Filter)
|
||||
# C. Smart Structure (für Profile, Werte, Entscheidungen)
|
||||
# - Strategie: By Heading (Harte Trennung an Überschriften)
|
||||
# - LLM-Filter: AN (verteilt Kanten auf Sektionen)
|
||||
structured_smart_edges:
|
||||
strategy: by_heading # Primärzerlegung: Harte Trennung
|
||||
enable_smart_edge_allocation: true # SEKUNDÄRVERFEINERUNG: LLM-Filter aktiv
|
||||
split_level: 2
|
||||
strategy: by_heading
|
||||
enable_smart_edge_allocation: true
|
||||
split_level: 2 # Trennt an H2 (##)
|
||||
max: 600
|
||||
target: 400
|
||||
overlap: [50, 80]
|
||||
|
||||
overlap: [50, 80] # Fallback
|
||||
|
||||
# ==============================================================================
|
||||
# 2. DEFAULTS
|
||||
# ==============================================================================
|
||||
defaults:
|
||||
retriever_weight: 1.0
|
||||
chunking_profile: sliding_standard # Fallback Profil
|
||||
chunking_profile: sliding_smart_edges # Fallback: Immer smart versuchen
|
||||
edge_defaults: []
|
||||
|
||||
# ==============================================================================
|
||||
# 3. TYPE DEFINITIONS
|
||||
# ==============================================================================
|
||||
# Hier werden Chunking, Retrieval-Gewichtung und GENERIERUNGS-SCHEMATA definiert.
|
||||
|
||||
types:
|
||||
|
||||
# --- WISSENSBAUSTEINE ---
|
||||
|
||||
concept:
|
||||
chunking_profile: sliding_smart_edges # Nutzt Kantenfilterung
|
||||
chunking_profile: sliding_smart_edges
|
||||
retriever_weight: 0.60
|
||||
edge_defaults: ["references", "related_to"]
|
||||
schema: # WP-07: Anleitung für LLM zur Erstellung
|
||||
- "Definition & Kernidee"
|
||||
- "Kontext & Hintergrund"
|
||||
- "Anwendungsbeispiele"
|
||||
- "Verwandte Konzepte"
|
||||
|
||||
source:
|
||||
chunking_profile: sliding_short # Kein LLM-Filter
|
||||
chunking_profile: sliding_short # Keine Smart Edges nötig (spart Ressourcen)
|
||||
retriever_weight: 0.50
|
||||
edge_defaults: []
|
||||
schema:
|
||||
- "Metadaten (Autor, URL, Datum)"
|
||||
- "Zusammenfassung (Key Takeaways)"
|
||||
- "Wichtige Zitate"
|
||||
- "Originaltext / Ausschnitte"
|
||||
|
||||
glossary:
|
||||
chunking_profile: sliding_short
|
||||
retriever_weight: 0.40
|
||||
edge_defaults: ["related_to"]
|
||||
schema:
|
||||
- "Begriffserklärung"
|
||||
- "Synonyme & Abgrenzung"
|
||||
|
||||
# --- IDENTITÄT & PERSÖNLICHKEIT ---
|
||||
|
||||
profile:
|
||||
chunking_profile: structured_smart_edges # Strukturiert + Kantenfilterung
|
||||
chunking_profile: structured_smart_edges # Struktur ist hier wichtig
|
||||
retriever_weight: 0.70
|
||||
edge_defaults: ["references", "related_to"]
|
||||
schema:
|
||||
- "Rolle & Beziehung"
|
||||
- "Wichtige Fakten & Daten"
|
||||
- "Gemeinsame Historie / Erfahrungen"
|
||||
- "Präferenzen & Werte"
|
||||
|
||||
value:
|
||||
chunking_profile: structured_smart_edges
|
||||
retriever_weight: 1.00
|
||||
retriever_weight: 1.00 # Höchste Priorität für die Decision Engine
|
||||
edge_defaults: ["related_to"]
|
||||
schema:
|
||||
- "Definition des Wertes"
|
||||
- "Warum ist das wichtig? (Motivation)"
|
||||
- "Leitsätze für Entscheidungen"
|
||||
- "Anti-Beispiele (Was wir vermeiden)"
|
||||
|
||||
principle:
|
||||
chunking_profile: structured_smart_edges
|
||||
retriever_weight: 0.95
|
||||
edge_defaults: ["derived_from", "references"]
|
||||
schema:
|
||||
- "Das Prinzip (Kernsatz)"
|
||||
- "Herleitung / Begründung"
|
||||
- "Anwendung in der Praxis"
|
||||
|
||||
belief:
|
||||
chunking_profile: sliding_short
|
||||
retriever_weight: 0.90
|
||||
edge_defaults: ["related_to"]
|
||||
schema:
|
||||
- "Glaubenssatz"
|
||||
- "Ursprung (Woher kommt das?)"
|
||||
- "Ist das noch hilfreich? (Reflexion)"
|
||||
|
||||
experience:
|
||||
chunking_profile: sliding_smart_edges
|
||||
retriever_weight: 0.90
|
||||
edge_defaults: ["derived_from", "references"]
|
||||
schema:
|
||||
- "Situation (Was ist passiert?)"
|
||||
- "Aktion (Was habe ich getan?)"
|
||||
- "Ergebnis (Was war die Folge?)"
|
||||
- "Learning (Was nehme ich mit?)"
|
||||
|
||||
# --- STRATEGIE & ENTSCHEIDUNG ---
|
||||
|
||||
goal:
|
||||
chunking_profile: sliding_smart_edges
|
||||
retriever_weight: 0.95
|
||||
edge_defaults: ["depends_on", "related_to"]
|
||||
schema:
|
||||
- "Zielsetzung (SMART)"
|
||||
- "Motivation (Warum?)"
|
||||
- "Erfolgskriterien (KPIs)"
|
||||
- "Meilensteine"
|
||||
|
||||
decision:
|
||||
chunking_profile: structured_smart_edges
|
||||
retriever_weight: 1.00
|
||||
edge_defaults: ["caused_by", "references"]
|
||||
schema:
|
||||
- "Kontext & Problemstellung"
|
||||
- "Betrachtete Optionen (Pros/Cons)"
|
||||
- "Die Entscheidung"
|
||||
- "Begründung (Warum diese Wahl?)"
|
||||
- "Erwartete Konsequenzen"
|
||||
|
||||
risk:
|
||||
chunking_profile: sliding_short
|
||||
retriever_weight: 0.85
|
||||
edge_defaults: ["related_to", "blocks"]
|
||||
|
||||
milestone:
|
||||
chunking_profile: sliding_short
|
||||
retriever_weight: 0.70
|
||||
edge_defaults: ["related_to", "part_of"]
|
||||
schema:
|
||||
- "Risiko-Beschreibung"
|
||||
- "Eintrittswahrscheinlichkeit & Impact"
|
||||
- "Mitigations-Strategie (Plan B)"
|
||||
|
||||
# --- OPERATIV ---
|
||||
|
||||
project:
|
||||
chunking_profile: sliding_smart_edges
|
||||
retriever_weight: 0.97
|
||||
edge_defaults: ["references", "depends_on"]
|
||||
schema:
|
||||
- "Mission / Zielsetzung"
|
||||
- "Aktueller Status"
|
||||
- "Nächste Schritte (Next Actions)"
|
||||
- "Offene Fragen / Blocker"
|
||||
- "Referenzen (Links)"
|
||||
|
||||
task:
|
||||
chunking_profile: sliding_short
|
||||
retriever_weight: 0.80
|
||||
edge_defaults: ["depends_on", "part_of"]
|
||||
schema:
|
||||
- "Aufgabe"
|
||||
- "Kontext / Wichtigkeit"
|
||||
- "Definition of Done"
|
||||
|
||||
journal:
|
||||
chunking_profile: sliding_smart_edges # Fließtext + Kantenfilterung
|
||||
chunking_profile: sliding_smart_edges
|
||||
retriever_weight: 0.80
|
||||
edge_defaults: ["references", "related_to"]
|
||||
edge_defaults: ["references", "related_to"]
|
||||
schema:
|
||||
- "Tages-Log / Ereignisse"
|
||||
- "Erkenntnisse & Gedanken"
|
||||
- "Entscheidungen des Tages"
|
||||
- "Fokus für Morgen"
|
||||
Loading…
Reference in New Issue
Block a user