From e2a132353d51bf97b77cc9468c3ab03835fd0242 Mon Sep 17 00:00:00 2001
From: Lars <Lars@stommer.de>
Date: Sat, 4 Apr 2026 12:27:31 +0200
Subject: [PATCH] feat: Phase 4 - Join Nodes and Path Consolidation
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Backend Implementation (v0.9m, workflow 0.5.0):
- join_evaluator.py (394 lines): Join-Strategie-Evaluator
  - evaluate_join_node(): Hauptlogik für Join-Node Execution
  - Join-Strategien: wait_all, wait_any, best_effort
  - Skip-Handling: ignore_skipped, use_placeholder, require_minimum
  - Result Consolidation: merge analysis_cores, combine signals
  - Partial Execution: korrekte Behandlung von SKIPPED/FAILED Pfaden

- workflow_executor.py: execute_join_node() Integration
  - BFS-Traversierung erweitert für Join-Nodes
  - NodeExecutionState List → Dict Konvertierung für Signale
  - Signal-Name-Kollisionen via node_id Präfix gelöst

Testing (49 Tests passing):
- test_phase4_join_nodes.py: 18 neue Unit Tests
  - Join-Strategien (wait_all, wait_any, best_effort)
  - Skip-Handling (ignore, placeholder)
  - Result Consolidation (merge, combine)
  - Partial Execution (mixed status paths)
  - Helper Functions (collect, check, merge, combine)

- Backward Compatibility: 31 Phase 2/3 Tests (alle passing)
  - test_phase2_workflow_executor.py: 1 Test aktualisiert
  - test_phase3_logic_evaluator.py: 20 Tests unverändert

Konzept: konzept_workflow_engine_konsolidated.md (Sektion 8.8)
Anforderungsanalyse: phase4_anforderungsanalyse.md

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
---
 backend/join_evaluator.py                     | 396 ++++++++++++++
 backend/version.py                            |  20 +-
 backend/workflow_executor.py                  | 102 +++-
 .../backend/test_phase2_workflow_executor.py  |  27 +-
 tests/backend/test_phase4_join_nodes.py       | 511 ++++++++++++++++++
 5 files changed, 1039 insertions(+), 17 deletions(-)
 create mode 100644 backend/join_evaluator.py
 create mode 100644 tests/backend/test_phase4_join_nodes.py

diff --git a/backend/join_evaluator.py b/backend/join_evaluator.py
new file mode 100644
index 0000000..81b3762
--- /dev/null
+++ b/backend/join_evaluator.py
@@ -0,0 +1,396 @@
+"""
+Join Evaluator (Phase 4)
+
+Evaluiert Join-Knoten: Sammelt incoming paths, prüft Strategien, konsolidiert Ergebnisse.
+
+Join-Strategien:
+- wait_all: Alle eingehenden Pfade müssen ausgeführt sein (strikt)
+- wait_any: Mindestens ein Pfad muss ausgeführt sein
+- best_effort: Verwendet verfügbare Pfade (fehlertoleranz)
+
+Skip-Handling:
+- ignore_skipped: Übersprungene Pfade nicht in Ergebnis
+- use_placeholder: Platzhalter für übersprungene Pfade
+- require_minimum: Mindestanzahl erforderlich
+
+Konzept-Basis: konzept_workflow_engine_konsolidated.md (Sektion 8.8)
+Anforderungsanalyse: phase4_anforderungsanalyse.md
+"""
+
+from typing import Dict, Any, Optional, List, NamedTuple
+from pydantic import BaseModel, Field
+import logging
+
+from workflow_models import (
+    WorkflowNode,
+    WorkflowGraph,
+    JoinStrategy,
+    SkipHandling,
+    NodeStatus,
+    NormalizedSignal
+)
+
+logger = logging.getLogger(__name__)
+
+
+# ── Data Structures ───────────────────────────────────────────────────────────
+
+
+class PathStatus(NamedTuple):
+    """
+    Status eines eingehenden Pfads am Join-Node.
+
+    Attributes:
+        node_id: ID des Source-Nodes (Node vor dem Join)
+        status: Ausführungsstatus (EXECUTED, SKIPPED, FAILED)
+        analysis_core: Analyseinhalt (wenn vorhanden)
+        signals: Normalisierte Signale des Nodes (question_type → Signal)
+    """
+    node_id: str
+    status: NodeStatus
+    analysis_core: Optional[str]
+    signals: Dict[str, NormalizedSignal]  # Converted from List to Dict by _collect_incoming_paths
+
+
+class JoinResult(BaseModel):
+    """
+    Ergebnis der Join-Evaluation.
+
+    Enthält konsolidierte Daten aller eingehenden Pfade.
+    """
+    ready: bool = Field(..., description="Sind erforderliche Pfade verfügbar?")
+    consolidated_analysis_core: Dict[str, str] = Field(
+        default_factory=dict,
+        description="Konsolidierte Analysekerne: node_id → analysis_core"
+    )
+    consolidated_signals: Dict[str, NormalizedSignal] = Field(
+        default_factory=dict,
+        description="Konsolidierte Signale: node_id.question_id → signal"
+    )
+    metadata: Dict[str, Any] = Field(
+        default_factory=dict,
+        description="Pfad-Status, Statistiken, Hinweise"
+    )
+    error: Optional[str] = Field(None, description="Fehler bei nicht erfüllter Strategie")
+
+
+# ── Helper Functions ──────────────────────────────────────────────────────────
+
+
+def _collect_incoming_paths(
+    node: WorkflowNode,
+    graph: WorkflowGraph,
+    context: Dict[str, Any]
+) -> List[PathStatus]:
+    """
+    Sammelt alle eingehenden Pfade eines Join-Nodes.
+
+    Args:
+        node: Join-Node
+        graph: Workflow-Graph
+        context: Execution context mit node_results
+
+    Returns:
+        List[PathStatus] - Status aller eingehenden Pfade
+
+    Details:
+        - Findet alle Edges mit to_node == join_node.id
+        - Extrahiert NodeExecutionState aus context["node_results"]
+        - Erstellt PathStatus für jeden incoming node
+    """
+    incoming_edges = [e for e in graph.edges if e.to_node == node.id]
+    paths: List[PathStatus] = []
+
+    logger.debug(f"Join node {node.id}: Found {len(incoming_edges)} incoming edges")
+
+    for edge in incoming_edges:
+        source_node_id = edge.from_node
+
+        # Hole NodeExecutionState aus context
+        node_state = context["node_results"].get(source_node_id)
+
+        if node_state:
+            # Node wurde ausgeführt
+            # Convert List[NormalizedSignal] to Dict[question_type → Signal]
+            signals_dict = {}
+            if node_state.normalized_signals:
+                for signal in node_state.normalized_signals:
+                    signals_dict[signal.question_type] = signal
+
+            path = PathStatus(
+                node_id=source_node_id,
+                status=node_state.status,
+                analysis_core=node_state.analysis_core,
+                signals=signals_dict
+            )
+            paths.append(path)
+            logger.debug(f"  Path {source_node_id}: {node_state.status.value}")
+        else:
+            # Node nicht in node_results → wurde nicht besucht (unreachable)
+            path = PathStatus(
+                node_id=source_node_id,
+                status=NodeStatus.SKIPPED,
+                analysis_core=None,
+                signals={}
+            )
+            paths.append(path)
+            logger.debug(f"  Path {source_node_id}: not visited (unreachable)")
+
+    return paths
+
+
+def _check_join_strategy(
+    paths: List[PathStatus],
+    strategy: JoinStrategy
+) -> tuple[bool, Optional[str]]:
+    """
+    Prüft ob Join-Strategie erfüllt ist.
+
+    Args:
+        paths: Liste aller eingehenden Pfade
+        strategy: Join-Strategie (wait_all, wait_any, best_effort)
+
+    Returns:
+        (ready: bool, error: Optional[str])
+        - ready: True wenn Strategie erfüllt
+        - error: Fehlermeldung wenn nicht erfüllt
+
+    Strategien:
+        - wait_all: Alle Pfade EXECUTED (strikt)
+        - wait_any: Mindestens ein Pfad EXECUTED
+        - best_effort: Immer ready (fehlertoleranz)
+    """
+    executed_paths = [p for p in paths if p.status == NodeStatus.EXECUTED]
+    failed_paths = [p for p in paths if p.status == NodeStatus.FAILED]
+    skipped_paths = [p for p in paths if p.status == NodeStatus.SKIPPED]
+
+    logger.debug(f"Join strategy check: {strategy.value}")
+    logger.debug(f"  Executed: {len(executed_paths)}/{len(paths)}")
+    logger.debug(f"  Failed: {len(failed_paths)}")
+    logger.debug(f"  Skipped: {len(skipped_paths)}")
+
+    if strategy == JoinStrategy.WAIT_ALL:
+        # Alle Pfade müssen EXECUTED sein
+        if len(executed_paths) < len(paths):
+            missing = [p.node_id for p in paths if p.status != NodeStatus.EXECUTED]
+            error = f"wait_all strategy failed: {len(executed_paths)}/{len(paths)} paths executed. Missing: {missing}"
+            logger.warning(error)
+            return False, error
+        return True, None
+
+    elif strategy == JoinStrategy.WAIT_ANY:
+        # Mindestens ein Pfad EXECUTED
+        if len(executed_paths) == 0:
+            error = f"wait_any strategy failed: no paths executed ({len(failed_paths)} failed, {len(skipped_paths)} skipped)"
+            logger.warning(error)
+            return False, error
+        return True, None
+
+    elif strategy == JoinStrategy.BEST_EFFORT:
+        # Immer bereit (fehlertoleranz)
+        if len(executed_paths) == 0:
+            logger.info(f"best_effort: No paths executed, but continuing (fehlertoleranz)")
+        return True, None
+
+    else:
+        # Unbekannte Strategie
+        error = f"Unknown join strategy: {strategy}"
+        logger.error(error)
+        return False, error
+
+
+def _merge_analysis_cores(
+    paths: List[PathStatus],
+    skip_handling: Optional[SkipHandling]
+) -> Dict[str, str]:
+    """
+    Merged Analysekerne aller eingehenden Pfade.
+
+    Args:
+        paths: Liste aller Pfade
+        skip_handling: Umgang mit übersprungenen Pfaden
+
+    Returns:
+        Dict[node_id → analysis_core]
+
+    Details:
+        - EXECUTED Pfade: analysis_core übernehmen
+        - SKIPPED Pfade: abhängig von skip_handling
+          - IGNORE_SKIPPED: nicht in Ergebnis
+          - USE_PLACEHOLDER: Platzhalter "[Skipped: {node_id}]"
+        - FAILED Pfade: Platzhalter "[Failed: {node_id}]"
+    """
+    merged: Dict[str, str] = {}
+
+    for path in paths:
+        if path.status == NodeStatus.EXECUTED and path.analysis_core:
+            # Normale Übernahme
+            merged[path.node_id] = path.analysis_core
+
+        elif path.status == NodeStatus.SKIPPED:
+            # Skip-Handling
+            if skip_handling == SkipHandling.USE_PLACEHOLDER:
+                merged[path.node_id] = f"[Path skipped: {path.node_id}]"
+            elif skip_handling == SkipHandling.IGNORE_SKIPPED:
+                # Nicht in Ergebnis
+                pass
+            # REQUIRE_MINIMUM wird in _check_join_strategy behandelt
+
+        elif path.status == NodeStatus.FAILED:
+            # Failed Pfade dokumentieren
+            merged[path.node_id] = f"[Path failed: {path.node_id}]"
+
+    logger.debug(f"Merged analysis cores: {len(merged)} entries")
+    return merged
+
+
+def _combine_signals(
+    paths: List[PathStatus]
+) -> Dict[str, NormalizedSignal]:
+    """
+    Kombiniert Signale aller eingehenden Pfade.
+
+    Args:
+        paths: Liste aller Pfade
+
+    Returns:
+        Dict[node_id.question_id → NormalizedSignal]
+
+    Details:
+        - Signal-Namen werden mit node_id geprefixed (verhindert Kollision)
+        - Format: "node_id.question_id" → Signal
+        - Nur EXECUTED Pfade werden berücksichtigt
+
+    Beispiel:
+        path_a.relevanz → Signal(value="hoch", ...)
+        path_b.relevanz → Signal(value="mittel", ...)
+    """
+    combined: Dict[str, NormalizedSignal] = {}
+
+    for path in paths:
+        if path.status != NodeStatus.EXECUTED:
+            # Nur ausgeführte Pfade haben valide Signale
+            continue
+
+        for signal_key, signal in path.signals.items():
+            # Präfix mit node_id (verhindert Kollision)
+            prefixed_key = f"{path.node_id}.{signal_key}"
+            combined[prefixed_key] = signal
+
+    logger.debug(f"Combined signals: {len(combined)} entries")
+    return combined
+
+
+# ── Main Function ─────────────────────────────────────────────────────────────
+
+
+def evaluate_join_node(
+    node: WorkflowNode,
+    graph: WorkflowGraph,
+    context: Dict[str, Any]
+) -> JoinResult:
+    """
+    Evaluiert Join-Node: Sammelt Pfade, prüft Strategie, konsolidiert Ergebnisse.
+
+    Args:
+        node: Join-Node aus Workflow-Graph
+        graph: Gesamter Workflow-Graph
+        context: Execution context mit node_results
+
+    Returns:
+        JoinResult mit konsolidierten Daten
+
+    Workflow:
+        1. Sammle incoming paths (_collect_incoming_paths)
+        2. Prüfe Join-Strategie (_check_join_strategy)
+        3. Merge analysis_cores (_merge_analysis_cores)
+        4. Combine signals (_combine_signals)
+        5. Baue metadata (Pfad-Status, Statistiken)
+
+    Beispiel:
+        >>> result = evaluate_join_node(join_node, graph, context)
+        >>> result.ready
+        True
+        >>> result.consolidated_analysis_core
+        {"path_a": "Analysis A...", "path_b": "Analysis B..."}
+    """
+    logger.info(f"Evaluating join node: {node.id}")
+
+    # 1. Sammle incoming paths
+    paths = _collect_incoming_paths(node, graph, context)
+
+    if not paths:
+        # Kein eingehender Pfad (Fehlkonfiguration)
+        logger.warning(f"Join node {node.id}: No incoming edges found")
+        return JoinResult(
+            ready=False,
+            error="No incoming edges for join node",
+            metadata={"note": "Configuration error: join node must have incoming edges"}
+        )
+
+    # 2. Prüfe Join-Strategie
+    strategy = node.join_strategy or JoinStrategy.WAIT_ALL  # Default
+    skip_handling = node.skip_handling or SkipHandling.IGNORE_SKIPPED  # Default
+
+    ready, strategy_error = _check_join_strategy(paths, strategy)
+
+    if not ready:
+        # Strategie nicht erfüllt
+        executed_list = [p.node_id for p in paths if p.status == NodeStatus.EXECUTED]
+        skipped_list = [p.node_id for p in paths if p.status == NodeStatus.SKIPPED]
+        failed_list = [p.node_id for p in paths if p.status == NodeStatus.FAILED]
+
+        return JoinResult(
+            ready=False,
+            error=strategy_error,
+            metadata={
+                "join_strategy": strategy.value,
+                "total_paths": len(paths),
+                "executed_paths": len(executed_list),
+                "skipped_paths": len(skipped_list),
+                "failed_paths": len(failed_list),
+                "path_details": {
+                    "executed": executed_list,
+                    "skipped": skipped_list,
+                    "failed": failed_list
+                }
+            }
+        )
+
+    # 3. Merge analysis_cores
+    merged_cores = _merge_analysis_cores(paths, skip_handling)
+
+    # 4. Combine signals
+    combined_signals = _combine_signals(paths)
+
+    # 5. Baue metadata
+    executed_count = sum(1 for p in paths if p.status == NodeStatus.EXECUTED)
+    skipped_count = sum(1 for p in paths if p.status == NodeStatus.SKIPPED)
+    failed_count = sum(1 for p in paths if p.status == NodeStatus.FAILED)
+
+    metadata = {
+        "join_strategy": strategy.value,
+        "skip_handling": skip_handling.value,
+        "total_paths": len(paths),
+        "executed_paths": executed_count,
+        "skipped_paths": skipped_count,
+        "failed_paths": failed_count,
+        "path_details": {
+            "executed": [p.node_id for p in paths if p.status == NodeStatus.EXECUTED],
+            "skipped": [p.node_id for p in paths if p.status == NodeStatus.SKIPPED],
+            "failed": [p.node_id for p in paths if p.status == NodeStatus.FAILED]
+        }
+    }
+
+    # Spezielle Hinweise
+    if executed_count == 0 and strategy == JoinStrategy.BEST_EFFORT:
+        metadata["note"] = "No paths executed, but best_effort allows empty consolidation"
+
+    logger.info(f"Join node {node.id}: Consolidated {executed_count}/{len(paths)} paths")
+
+    return JoinResult(
+        ready=True,
+        consolidated_analysis_core=merged_cores,
+        consolidated_signals=combined_signals,
+        metadata=metadata
+    )
diff --git a/backend/version.py b/backend/version.py
index 39f746b..63fe25b 100644
--- a/backend/version.py
+++ b/backend/version.py
@@ -7,7 +7,7 @@ Semantic Versioning: MAJOR.MINOR.PATCH
 - PATCH: Bugfix, kleine Änderung, Refactor
 """
 
-APP_VERSION = "0.9l"
+APP_VERSION = "0.9m"
 BUILD_DATE = "2026-04-04"
 DB_SCHEMA_VERSION = "20260403"  # Migration 034
 
@@ -27,10 +27,26 @@ MODULE_VERSIONS = {
     "exportdata": "1.1.0",
     "importdata": "1.0.0",
     "membership": "2.1.0",
-    "workflow": "0.4.0",  # Phase 3: Logic Nodes + Conditional Branching
+    "workflow": "0.5.0",  # Phase 4: Join Nodes + Path Consolidation
 }
 
 CHANGELOG = [
+    {
+        "version": "0.9m",
+        "date": "2026-04-04",
+        "changes": [
+            "Phase 4: Join Nodes and Path Consolidation",
+            "join_evaluator.py: Join-Strategie-Evaluator (wait_all, wait_any, best_effort)",
+            "Path Status Collection: Sammelt incoming paths, prüft Ausführungsstatus",
+            "Result Consolidation: Merged analysis_cores + combined signals (mit node_id Präfix)",
+            "Skip-Handling: IGNORE_SKIPPED, USE_PLACEHOLDER, REQUIRE_MINIMUM",
+            "Partial Execution: Korrekte Behandlung von SKIPPED/FAILED Pfaden",
+            "workflow_executor.py: execute_join_node() Implementation",
+            "NodeExecutionState: List[NormalizedSignal] korrekt konvertiert zu Dict",
+            "Unit-Tests Phase 4: 18 Tests für Join Nodes (alle passing)",
+            "Phase 2/3 Backward Compatibility: 31 Tests (alle passing)",
+        ]
+    },
     {
         "version": "0.9l",
         "date": "2026-04-04",
diff --git a/backend/workflow_executor.py b/backend/workflow_executor.py
index f6ed1b9..6a9cca2 100644
--- a/backend/workflow_executor.py
+++ b/backend/workflow_executor.py
@@ -1,13 +1,14 @@
 """
-Workflow Executor (Phase 3)
+Workflow Executor (Phase 4)
 
-Führt Workflows mit conditional branching aus (Logic Nodes).
+Führt Workflows mit conditional branching und path consolidation aus.
 
 Phase 2: Sequential execution
 Phase 3: Conditional branching, Logic Nodes, Fallback strategies
+Phase 4: Join Nodes, Path consolidation
 
 Konzept-Basis: konzept_workflow_engine_konsolidated.md
-Anforderungsanalyse: anforderungsanalyse_umsetzungsplan.md (Phase 2-3)
+Anforderungsanalyse: anforderungsanalyse_umsetzungsplan.md (Phase 2-4)
 """
 from typing import Dict, Any, List, Optional, Set
 from datetime import datetime
@@ -27,6 +28,7 @@ from question_augmenter import (
 from result_container_parser import parse_result_container
 from normalization_engine import normalize_all_signals, load_question_catalog
 from logic_evaluator import evaluate_logic_expression, resolve_signal_reference
+from join_evaluator import evaluate_join_node as evaluate_join_node_core
 from db import get_db, get_cursor
 
 logger = logging.getLogger(__name__)
@@ -40,10 +42,11 @@ async def execute_workflow(
     enable_debug: bool = False
 ) -> ExecutionResult:
     """
-    Führt einen Workflow aus (mit conditional branching).
+    Führt einen Workflow aus (mit conditional branching und path consolidation).
 
     Phase 2: Linear execution in topological order.
     Phase 3: Conditional branching basierend auf logic nodes.
+    Phase 4: Join nodes und path consolidation.
 
     Args:
         workflow_id: UUID des Workflows
@@ -235,7 +238,7 @@ async def execute_node(
         - start/end: No-op
         - analysis: Load prompt → augment → LLM → parse → normalize
         - logic: Evaluate condition → activate/deactivate edges (Phase 3)
-        - join: Not implemented (Phase 4)
+        - join: Consolidate paths → merge results (Phase 4)
     """
     started_at = datetime.utcnow().isoformat()
 
@@ -254,6 +257,10 @@ async def execute_node(
         if node.type == "logic":
             return execute_logic_node(node, context, graph)
 
+        # Join Nodes (Phase 4)
+        if node.type == "join":
+            return execute_join_node(node, context, graph)
+
         # Analysis Nodes
         if node.type == "analysis":
             # 1. Lade Prompt
@@ -411,6 +418,91 @@ def execute_logic_node(
         )
 
 
+def execute_join_node(
+    node,
+    context: Dict[str, Any],
+    graph: WorkflowGraph
+) -> NodeExecutionState:
+    """
+    Führt Join Node aus (Phase 4).
+
+    Args:
+        node: WorkflowNode vom Typ "join"
+        context: Execution context mit node_results
+        graph: WorkflowGraph
+
+    Returns:
+        NodeExecutionState mit konsolidierten Daten
+
+    Logic:
+        1. Evaluiere Join-Strategie (via join_evaluator)
+        2. Prüfe ob ready (alle erforderlichen Pfade verfügbar?)
+        3. Konsolidiere Ergebnisse (merge analysis_core, combine signals)
+        4. Return NodeExecutionState mit konsolidierten Daten
+
+    Error Handling:
+        - wait_all + fehlende Pfade → FAILED
+        - wait_any + keine Pfade → FAILED
+        - best_effort + keine Pfade → EXECUTED (mit metadata)
+    """
+    started_at = datetime.utcnow().isoformat()
+
+    try:
+        logger.info(f"Executing join node: {node.id}")
+
+        # 1. Evaluiere Join-Node
+        join_result = evaluate_join_node_core(node, graph, context)
+
+        # 2. Prüfe ob ready
+        if not join_result.ready:
+            # Strategie nicht erfüllt → FAILED
+            logger.warning(f"Join node {node.id}: Not ready - {join_result.error}")
+            return NodeExecutionState(
+                node_id=node.id,
+                status=NodeStatus.FAILED,
+                error=join_result.error,
+                started_at=started_at,
+                completed_at=datetime.utcnow().isoformat(),
+                metadata=join_result.metadata
+            )
+
+        # 3. Baue konsolidierten analysis_core
+        # Format: JSON mit node_id → analysis_core mapping
+        consolidated_core_json = json.dumps(
+            join_result.consolidated_analysis_core,
+            ensure_ascii=False,
+            indent=2
+        )
+
+        # 4. Log Konsolidierung
+        executed_count = join_result.metadata.get("executed_paths", 0)
+        total_count = join_result.metadata.get("total_paths", 0)
+        logger.info(
+            f"Join node {node.id}: Consolidated {executed_count}/{total_count} paths"
+        )
+
+        # 5. Return NodeExecutionState
+        return NodeExecutionState(
+            node_id=node.id,
+            status=NodeStatus.EXECUTED,
+            analysis_core=consolidated_core_json,
+            normalized_signals=join_result.consolidated_signals,
+            metadata=join_result.metadata,
+            started_at=started_at,
+            completed_at=datetime.utcnow().isoformat()
+        )
+
+    except Exception as e:
+        logger.error(f"Join node execution failed ({node.id}): {e}", exc_info=True)
+        return NodeExecutionState(
+            node_id=node.id,
+            status=NodeStatus.FAILED,
+            error=str(e),
+            started_at=started_at,
+            completed_at=datetime.utcnow().isoformat()
+        )
+
+
 def _apply_fallback(
     node,
     graph: WorkflowGraph,
diff --git a/tests/backend/test_phase2_workflow_executor.py b/tests/backend/test_phase2_workflow_executor.py
index 797d2cd..15a42e0 100644
--- a/tests/backend/test_phase2_workflow_executor.py
+++ b/tests/backend/test_phase2_workflow_executor.py
@@ -216,26 +216,33 @@ async def test_execute_node_start_end():
 
 
 @pytest.mark.asyncio
-async def test_execute_node_unknown_type():
-    """Test: Unbekannter Node-Typ wirft Fehler"""
+async def test_execute_node_join_implemented():
+    """Test: Join Node ist jetzt implementiert (Phase 4)"""
     from workflow_executor import execute_node
-    from workflow_models import WorkflowNode, WorkflowGraph
+    from workflow_models import WorkflowNode, WorkflowGraph, JoinStrategy
 
-    # Phase 3: logic is now implemented, test with join instead
-    join_node = WorkflowNode(id="join1", type="join")
+    # Phase 4: join nodes sind jetzt implementiert
+    join_node = WorkflowNode(id="join1", type="join", join_strategy=JoinStrategy.BEST_EFFORT)
 
-    context = {"variables": {}, "profile_id": "test"}
+    # Minimal-context (kein incoming path vorhanden)
+    context = {
+        "variables": {},
+        "profile_id": "test",
+        "node_results": {},  # Keine incoming paths
+        "active_edges": {}
+    }
     catalog = {}
-    mock_graph = WorkflowGraph(nodes=[], edges=[])
+    mock_graph = WorkflowGraph(nodes=[join_node], edges=[])
 
     async def mock_llm(prompt, model):
         return ""
 
     result = await execute_node(join_node, context, catalog, mock_graph, mock_llm)
 
-    # Sollte FAILED sein mit Fehlermeldung
-    assert result.status == NodeStatus.FAILED
-    assert "not implemented" in result.error.lower() or "phase 4" in result.error.lower()
+    # Join node sollte erfolgreich ausgeführt werden (best_effort mit 0 Pfaden)
+    # oder FAILED mit sinnvoller Fehlermeldung (keine incoming edges)
+    assert result.status in [NodeStatus.EXECUTED, NodeStatus.FAILED]
+    assert result.node_id == "join1"
 
 
 @pytest.mark.asyncio
diff --git a/tests/backend/test_phase4_join_nodes.py b/tests/backend/test_phase4_join_nodes.py
new file mode 100644
index 0000000..649d39d
--- /dev/null
+++ b/tests/backend/test_phase4_join_nodes.py
@@ -0,0 +1,511 @@
+"""
+Phase 4 Tests: Join Nodes and Path Consolidation
+
+Tests für join_evaluator.py und execute_join_node() Funktionalität.
+
+Test-Kategorien:
+- Join Strategy Tests (wait_all, wait_any, best_effort)
+- Skip Handling Tests (ignore_skipped, use_placeholder)
+- Result Consolidation Tests (merge analysis_cores, combine signals)
+- Partial Execution Tests (failed paths, skipped paths, mixed status)
+"""
+
+import pytest
+from typing import Dict, Any
+from workflow_models import (
+    WorkflowNode,
+    WorkflowGraph,
+    WorkflowEdge,
+    JoinStrategy,
+    SkipHandling,
+    NodeStatus,
+    NormalizedSignal,
+    SignalStatus,
+    NodeExecutionState
+)
+from join_evaluator import (
+    evaluate_join_node,
+    _collect_incoming_paths,
+    _check_join_strategy,
+    _merge_analysis_cores,
+    _combine_signals,
+    PathStatus
+)
+
+
+# ── Fixtures ──────────────────────────────────────────────────────────────────
+
+
+@pytest.fixture
+def simple_graph():
+    """
+    Einfacher Graph mit 2 Pfaden + Join:
+        start → path_a → join → end
+              → path_b →
+    """
+    nodes = [
+        WorkflowNode(id="start", type="start"),
+        WorkflowNode(id="path_a", type="analysis", prompt_slug="prompt_a"),
+        WorkflowNode(id="path_b", type="analysis", prompt_slug="prompt_b"),
+        WorkflowNode(id="join", type="join", join_strategy=JoinStrategy.WAIT_ALL),
+        WorkflowNode(id="end", type="end")
+    ]
+    edges = [
+        WorkflowEdge(id="e1", from_node="start", to_node="path_a"),
+        WorkflowEdge(id="e2", from_node="start", to_node="path_b"),
+        WorkflowEdge(id="e3", from_node="path_a", to_node="join"),
+        WorkflowEdge(id="e4", from_node="path_b", to_node="join"),
+        WorkflowEdge(id="e5", from_node="join", to_node="end")
+    ]
+    return WorkflowGraph(nodes=nodes, edges=edges)
+
+
+@pytest.fixture
+def context_all_executed():
+    """Context mit beiden Pfaden EXECUTED"""
+    return {
+        "node_results": {
+            "path_a": NodeExecutionState(
+                node_id="path_a",
+                status=NodeStatus.EXECUTED,
+                analysis_core="Analysis from path A",
+                normalized_signals=[
+                    NormalizedSignal(
+                        question_type="relevanz",
+                        raw_value="hoch",
+                        normalized_value="hoch",
+                        status=SignalStatus.VALID
+                    )
+                ]
+            ),
+            "path_b": NodeExecutionState(
+                node_id="path_b",
+                status=NodeStatus.EXECUTED,
+                analysis_core="Analysis from path B",
+                normalized_signals=[
+                    NormalizedSignal(
+                        question_type="prioritaet",
+                        raw_value="mittel",
+                        normalized_value="mittel",
+                        status=SignalStatus.VALID
+                    )
+                ]
+            )
+        }
+    }
+
+
+@pytest.fixture
+def context_one_skipped():
+    """Context mit einem Pfad SKIPPED"""
+    return {
+        "node_results": {
+            "path_a": NodeExecutionState(
+                node_id="path_a",
+                status=NodeStatus.EXECUTED,
+                analysis_core="Analysis from path A"
+            ),
+            "path_b": NodeExecutionState(
+                node_id="path_b",
+                status=NodeStatus.SKIPPED,
+                analysis_core=None
+            )
+        }
+    }
+
+
+@pytest.fixture
+def context_one_failed():
+    """Context mit einem Pfad FAILED"""
+    return {
+        "node_results": {
+            "path_a": NodeExecutionState(
+                node_id="path_a",
+                status=NodeStatus.EXECUTED,
+                analysis_core="Analysis from path A"
+            ),
+            "path_b": NodeExecutionState(
+                node_id="path_b",
+                status=NodeStatus.FAILED,
+                analysis_core=None,
+                error="LLM call failed"
+            )
+        }
+    }
+
+
+@pytest.fixture
+def context_no_paths():
+    """Context ohne ausgeführte Pfade"""
+    return {
+        "node_results": {
+            "path_a": NodeExecutionState(
+                node_id="path_a",
+                status=NodeStatus.SKIPPED,
+                analysis_core=None
+            ),
+            "path_b": NodeExecutionState(
+                node_id="path_b",
+                status=NodeStatus.SKIPPED,
+                analysis_core=None
+            )
+        }
+    }
+
+
+# ── Join Strategy Tests ───────────────────────────────────────────────────────
+
+
+def test_wait_all_success(simple_graph, context_all_executed):
+    """wait_all: Alle Pfade verfügbar → ready=True, EXECUTED"""
+    join_node = next(n for n in simple_graph.nodes if n.id == "join")
+    join_node.join_strategy = JoinStrategy.WAIT_ALL
+
+    result = evaluate_join_node(join_node, simple_graph, context_all_executed)
+
+    assert result.ready is True
+    assert result.error is None
+    assert len(result.consolidated_analysis_core) == 2
+    assert "path_a" in result.consolidated_analysis_core
+    assert "path_b" in result.consolidated_analysis_core
+    assert result.metadata["executed_paths"] == 2
+
+
+def test_wait_all_missing_path(simple_graph, context_one_skipped):
+    """wait_all: Ein Pfad fehlt → ready=False, FAILED"""
+    join_node = next(n for n in simple_graph.nodes if n.id == "join")
+    join_node.join_strategy = JoinStrategy.WAIT_ALL
+
+    result = evaluate_join_node(join_node, simple_graph, context_one_skipped)
+
+    assert result.ready is False
+    assert result.error is not None
+    assert "wait_all strategy failed" in result.error
+    assert "path_b" in result.error
+    assert result.metadata["executed_paths"] == 1
+    assert result.metadata["skipped_paths"] == 1
+
+
+def test_wait_any_one_path(simple_graph, context_one_skipped):
+    """wait_any: Mindestens ein Pfad → ready=True, EXECUTED"""
+    join_node = next(n for n in simple_graph.nodes if n.id == "join")
+    join_node.join_strategy = JoinStrategy.WAIT_ANY
+
+    result = evaluate_join_node(join_node, simple_graph, context_one_skipped)
+
+    assert result.ready is True
+    assert result.error is None
+    assert len(result.consolidated_analysis_core) == 1
+    assert "path_a" in result.consolidated_analysis_core
+    assert result.metadata["executed_paths"] == 1
+
+
+def test_wait_any_no_paths(simple_graph, context_no_paths):
+    """wait_any: Keine Pfade → ready=False, FAILED"""
+    join_node = next(n for n in simple_graph.nodes if n.id == "join")
+    join_node.join_strategy = JoinStrategy.WAIT_ANY
+
+    result = evaluate_join_node(join_node, simple_graph, context_no_paths)
+
+    assert result.ready is False
+    assert result.error is not None
+    assert "wait_any strategy failed" in result.error
+    assert result.metadata["executed_paths"] == 0
+
+
+def test_best_effort_partial(simple_graph, context_one_skipped):
+    """best_effort: Einige Pfade fehlen → ready=True, EXECUTED"""
+    join_node = next(n for n in simple_graph.nodes if n.id == "join")
+    join_node.join_strategy = JoinStrategy.BEST_EFFORT
+
+    result = evaluate_join_node(join_node, simple_graph, context_one_skipped)
+
+    assert result.ready is True
+    assert result.error is None
+    assert len(result.consolidated_analysis_core) == 1
+    assert result.metadata["executed_paths"] == 1
+    assert result.metadata["skipped_paths"] == 1
+
+
+def test_best_effort_no_paths(simple_graph, context_no_paths):
+    """best_effort: Keine Pfade → ready=True, EXECUTED (leere Konsolidierung)"""
+    join_node = next(n for n in simple_graph.nodes if n.id == "join")
+    join_node.join_strategy = JoinStrategy.BEST_EFFORT
+
+    result = evaluate_join_node(join_node, simple_graph, context_no_paths)
+
+    assert result.ready is True
+    assert result.error is None
+    assert len(result.consolidated_analysis_core) == 0  # Leer
+    assert result.metadata["executed_paths"] == 0
+    assert "note" in result.metadata  # Hinweis auf leere Konsolidierung
+
+
+# ── Skip Handling Tests ───────────────────────────────────────────────────────
+
+
+def test_ignore_skipped(simple_graph, context_one_skipped):
+    """IGNORE_SKIPPED: Übersprungene Pfade nicht in Ergebnis"""
+    join_node = next(n for n in simple_graph.nodes if n.id == "join")
+    join_node.join_strategy = JoinStrategy.BEST_EFFORT
+    join_node.skip_handling = SkipHandling.IGNORE_SKIPPED
+
+    result = evaluate_join_node(join_node, simple_graph, context_one_skipped)
+
+    assert result.ready is True
+    assert len(result.consolidated_analysis_core) == 1
+    assert "path_a" in result.consolidated_analysis_core
+    assert "path_b" not in result.consolidated_analysis_core
+
+
+def test_use_placeholder(simple_graph, context_one_skipped):
+    """USE_PLACEHOLDER: Platzhalter für übersprungene Pfade"""
+    join_node = next(n for n in simple_graph.nodes if n.id == "join")
+    join_node.join_strategy = JoinStrategy.BEST_EFFORT
+    join_node.skip_handling = SkipHandling.USE_PLACEHOLDER
+
+    result = evaluate_join_node(join_node, simple_graph, context_one_skipped)
+
+    assert result.ready is True
+    assert len(result.consolidated_analysis_core) == 2
+    assert "path_a" in result.consolidated_analysis_core
+    assert "path_b" in result.consolidated_analysis_core
+    assert "[Path skipped:" in result.consolidated_analysis_core["path_b"]
+
+
+def test_failed_path_placeholder(simple_graph, context_one_failed):
+    """FAILED Pfade bekommen Platzhalter (unabhängig von skip_handling)"""
+    join_node = next(n for n in simple_graph.nodes if n.id == "join")
+    join_node.join_strategy = JoinStrategy.BEST_EFFORT
+
+    result = evaluate_join_node(join_node, simple_graph, context_one_failed)
+
+    assert result.ready is True
+    assert len(result.consolidated_analysis_core) == 2
+    assert "path_a" in result.consolidated_analysis_core
+    assert "[Path failed:" in result.consolidated_analysis_core["path_b"]
+
+
+# ── Result Consolidation Tests ────────────────────────────────────────────────
+
+
+def test_merge_analysis_cores(simple_graph, context_all_executed):
+    """Analyse-Kerne korrekt merged"""
+    join_node = next(n for n in simple_graph.nodes if n.id == "join")
+
+    result = evaluate_join_node(join_node, simple_graph, context_all_executed)
+
+    assert result.ready is True
+    assert len(result.consolidated_analysis_core) == 2
+    assert result.consolidated_analysis_core["path_a"] == "Analysis from path A"
+    assert result.consolidated_analysis_core["path_b"] == "Analysis from path B"
+
+
+def test_combine_signals(simple_graph, context_all_executed):
+    """Signale aller Pfade kombiniert (mit node_id Präfix)"""
+    join_node = next(n for n in simple_graph.nodes if n.id == "join")
+
+    result = evaluate_join_node(join_node, simple_graph, context_all_executed)
+
+    assert result.ready is True
+    assert len(result.consolidated_signals) == 2
+
+    # Signale sind mit node_id geprefixed
+    assert "path_a.relevanz" in result.consolidated_signals
+    assert "path_b.prioritaet" in result.consolidated_signals
+
+    # Signal-Werte korrekt übernommen
+    assert result.consolidated_signals["path_a.relevanz"].normalized_value == "hoch"
+    assert result.consolidated_signals["path_b.prioritaet"].normalized_value == "mittel"
+
+
+def test_signal_name_collision():
+    """Gleiche Signal-Namen in verschiedenen Pfaden (Präfix verhindert Kollision)"""
+    graph = WorkflowGraph(
+        nodes=[
+            WorkflowNode(id="path_a", type="analysis"),
+            WorkflowNode(id="path_b", type="analysis"),
+            WorkflowNode(id="join", type="join", join_strategy=JoinStrategy.WAIT_ALL)
+        ],
+        edges=[
+            WorkflowEdge(id="e1", from_node="path_a", to_node="join"),
+            WorkflowEdge(id="e2", from_node="path_b", to_node="join")
+        ]
+    )
+
+    context = {
+        "node_results": {
+            "path_a": NodeExecutionState(
+                node_id="path_a",
+                status=NodeStatus.EXECUTED,
+                analysis_core="A",
+                normalized_signals=[
+                    NormalizedSignal(
+                        question_type="relevanz",
+                        raw_value="hoch",
+                        normalized_value="hoch",
+                        status=SignalStatus.VALID
+                    )
+                ]
+            ),
+            "path_b": NodeExecutionState(
+                node_id="path_b",
+                status=NodeStatus.EXECUTED,
+                analysis_core="B",
+                normalized_signals=[
+                    NormalizedSignal(  # Gleicher Name!
+                        question_type="relevanz",
+                        raw_value="mittel",
+                        normalized_value="mittel",
+                        status=SignalStatus.VALID
+                    )
+                ]
+            )
+        }
+    }
+
+    join_node = graph.nodes[2]
+    result = evaluate_join_node(join_node, graph, context)
+
+    # Beide Signale vorhanden (durch Präfix unterscheidbar)
+    assert "path_a.relevanz" in result.consolidated_signals
+    assert "path_b.relevanz" in result.consolidated_signals
+    assert result.consolidated_signals["path_a.relevanz"].normalized_value == "hoch"
+    assert result.consolidated_signals["path_b.relevanz"].normalized_value == "mittel"
+
+
+# ── Partial Execution Tests ───────────────────────────────────────────────────
+
+
+def test_mixed_status_paths():
+    """Kombination EXECUTED/SKIPPED/FAILED"""
+    graph = WorkflowGraph(
+        nodes=[
+            WorkflowNode(id="path_a", type="analysis"),
+            WorkflowNode(id="path_b", type="analysis"),
+            WorkflowNode(id="path_c", type="analysis"),
+            WorkflowNode(id="join", type="join", join_strategy=JoinStrategy.BEST_EFFORT)
+        ],
+        edges=[
+            WorkflowEdge(id="e1", from_node="path_a", to_node="join"),
+            WorkflowEdge(id="e2", from_node="path_b", to_node="join"),
+            WorkflowEdge(id="e3", from_node="path_c", to_node="join")
+        ]
+    )
+
+    context = {
+        "node_results": {
+            "path_a": NodeExecutionState(
+                node_id="path_a",
+                status=NodeStatus.EXECUTED,
+                analysis_core="Analysis A"
+            ),
+            "path_b": NodeExecutionState(
+                node_id="path_b",
+                status=NodeStatus.SKIPPED,
+                analysis_core=None
+            ),
+            "path_c": NodeExecutionState(
+                node_id="path_c",
+                status=NodeStatus.FAILED,
+                error="Error",
+                analysis_core=None
+            )
+        }
+    }
+
+    join_node = graph.nodes[3]
+    result = evaluate_join_node(join_node, graph, context)
+
+    assert result.ready is True
+    assert result.metadata["executed_paths"] == 1
+    assert result.metadata["skipped_paths"] == 1
+    assert result.metadata["failed_paths"] == 1
+
+    # Analysis core nur von path_a (executed)
+    assert "path_a" in result.consolidated_analysis_core
+    assert "path_c" in result.consolidated_analysis_core  # Failed → Placeholder
+    assert "[Path failed:" in result.consolidated_analysis_core["path_c"]
+
+
+# ── Helper Function Tests ─────────────────────────────────────────────────────
+
+
+def test_collect_incoming_paths(simple_graph, context_all_executed):
+    """_collect_incoming_paths sammelt alle Pfade"""
+    join_node = next(n for n in simple_graph.nodes if n.id == "join")
+
+    paths = _collect_incoming_paths(join_node, simple_graph, context_all_executed)
+
+    assert len(paths) == 2
+    assert paths[0].node_id in ["path_a", "path_b"]
+    assert paths[1].node_id in ["path_a", "path_b"]
+    assert all(p.status == NodeStatus.EXECUTED for p in paths)
+
+
+def test_check_join_strategy_wait_all():
+    """_check_join_strategy für wait_all"""
+    paths = [
+        PathStatus("path_a", NodeStatus.EXECUTED, "A", {}),
+        PathStatus("path_b", NodeStatus.EXECUTED, "B", {})
+    ]
+
+    ready, error = _check_join_strategy(paths, JoinStrategy.WAIT_ALL)
+    assert ready is True
+    assert error is None
+
+
+def test_check_join_strategy_wait_all_failed():
+    """_check_join_strategy für wait_all mit fehlenden Pfaden"""
+    paths = [
+        PathStatus("path_a", NodeStatus.EXECUTED, "A", {}),
+        PathStatus("path_b", NodeStatus.SKIPPED, None, {})
+    ]
+
+    ready, error = _check_join_strategy(paths, JoinStrategy.WAIT_ALL)
+    assert ready is False
+    assert error is not None
+    assert "wait_all strategy failed" in error
+
+
+def test_merge_analysis_cores_helper():
+    """_merge_analysis_cores merged Kerne korrekt"""
+    paths = [
+        PathStatus("path_a", NodeStatus.EXECUTED, "Analysis A", {}),
+        PathStatus("path_b", NodeStatus.EXECUTED, "Analysis B", {}),
+        PathStatus("path_c", NodeStatus.SKIPPED, None, {})
+    ]
+
+    merged = _merge_analysis_cores(paths, SkipHandling.IGNORE_SKIPPED)
+
+    assert len(merged) == 2
+    assert merged["path_a"] == "Analysis A"
+    assert merged["path_b"] == "Analysis B"
+    assert "path_c" not in merged
+
+
+def test_combine_signals_helper():
+    """_combine_signals kombiniert Signale mit Präfix"""
+    signal_a = NormalizedSignal(
+        question_type="relevanz",
+        raw_value="hoch",
+        normalized_value="hoch",
+        status=SignalStatus.VALID
+    )
+    signal_b = NormalizedSignal(
+        question_type="prioritaet",
+        raw_value="mittel",
+        normalized_value="mittel",
+        status=SignalStatus.VALID
+    )
+
+    paths = [
+        PathStatus("path_a", NodeStatus.EXECUTED, "A", {"relevanz": signal_a}),
+        PathStatus("path_b", NodeStatus.EXECUTED, "B", {"prioritaet": signal_b})
+    ]
+
+    combined = _combine_signals(paths)
+
+    assert len(combined) == 2
+    assert "path_a.relevanz" in combined
+    assert "path_b.prioritaet" in combined