feat(kernel): add multi-skill orchestration bridge + true parallel execution
Some checks failed
CI / Lint & TypeCheck (push) Has been cancelled
CI / Unit Tests (push) Has been cancelled
CI / Build Frontend (push) Has been cancelled
CI / Rust Check (push) Has been cancelled
CI / Security Scan (push) Has been cancelled
CI / E2E Tests (push) Has been cancelled

- Kernel orchestration bridge: execute_orchestration, auto_compose_skills,
  validate_orchestration methods on Kernel struct
- True parallel execution: replace sequential for-loop with tokio::JoinSet
  for concurrent node execution within parallel groups
- Tauri commands: orchestration_execute (auto-compose or pre-defined graph),
  orchestration_validate (dry-run validation)
- Full type conversions: OrchestrationRequest/Response with camelCase serde

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
iven
2026-04-04 09:18:26 +08:00
parent 1399054547
commit f4ed1b33e0
6 changed files with 422 additions and 37 deletions

View File

@@ -7,6 +7,7 @@ mod skills;
mod hands; mod hands;
mod triggers; mod triggers;
mod approvals; mod approvals;
mod orchestration;
#[cfg(feature = "multi-agent")] #[cfg(feature = "multi-agent")]
mod a2a; mod a2a;

View File

@@ -0,0 +1,71 @@
//! Kernel-level orchestration methods
//!
//! Bridges the zclaw-skills orchestration engine to the Kernel,
//! providing high-level orchestration execution via Tauri commands.
use std::collections::HashMap;
use serde_json::Value;
use zclaw_types::Result;
use super::Kernel;
use zclaw_skills::orchestration::{OrchestrationPlanner, SkillGraphExecutor};
impl Kernel {
    /// Execute a skill orchestration graph with the given inputs.
    ///
    /// Builds a `DefaultExecutor` over the kernel's `SkillRegistry`, creates
    /// an execution plan, and runs the graph; nodes inside each parallel
    /// group execute concurrently.
    pub async fn execute_orchestration(
        &self,
        graph: &zclaw_skills::orchestration::SkillGraph,
        inputs: HashMap<String, Value>,
        context: &zclaw_skills::SkillContext,
    ) -> Result<zclaw_skills::orchestration::OrchestrationResult> {
        zclaw_skills::orchestration::DefaultExecutor::new(self.skills.clone())
            .execute(graph, inputs, context)
            .await
    }

    /// Execute an orchestration with progress tracking.
    ///
    /// `progress_fn` is invoked at each stage of execution so the frontend
    /// can render real-time progress.
    pub async fn execute_orchestration_with_progress<F>(
        &self,
        graph: &zclaw_skills::orchestration::SkillGraph,
        inputs: HashMap<String, Value>,
        context: &zclaw_skills::SkillContext,
        progress_fn: F,
    ) -> Result<zclaw_skills::orchestration::OrchestrationResult>
    where
        F: Fn(zclaw_skills::orchestration::OrchestrationProgress) + Send + Sync,
    {
        zclaw_skills::orchestration::DefaultExecutor::new(self.skills.clone())
            .execute_with_progress(graph, inputs, context, progress_fn)
            .await
    }

    /// Auto-compose a skill graph from a list of skill IDs.
    ///
    /// Delegates to `DefaultPlanner`, which analyzes input/output schemas to
    /// infer data-flow edges between skills.
    pub async fn auto_compose_skills(
        &self,
        skill_ids: &[zclaw_types::SkillId],
    ) -> Result<zclaw_skills::orchestration::SkillGraph> {
        zclaw_skills::orchestration::DefaultPlanner::new()
            .auto_compose(skill_ids, &self.skills)
            .await
    }

    /// Validate a skill graph without executing it.
    pub async fn validate_orchestration(
        &self,
        graph: &zclaw_skills::orchestration::SkillGraph,
    ) -> Vec<zclaw_skills::orchestration::ValidationError> {
        zclaw_skills::orchestration::validate_graph(graph, &self.skills).await
    }
}

View File

@@ -17,6 +17,12 @@ use super::{
planner::OrchestrationPlanner, planner::OrchestrationPlanner,
}; };
/// Wrapper to make NodeResult Send for JoinSet
struct ParallelNodeResult {
node_id: String,
result: NodeResult,
}
/// Skill graph executor trait /// Skill graph executor trait
#[async_trait::async_trait] #[async_trait::async_trait]
pub trait SkillGraphExecutor: Send + Sync { pub trait SkillGraphExecutor: Send + Sync {
@@ -76,7 +82,8 @@ impl DefaultExecutor {
cancellations.get(graph_id).copied().unwrap_or(false) cancellations.get(graph_id).copied().unwrap_or(false)
} }
/// Execute a single node /// Execute a single node (used by pipeline orchestration action driver)
#[allow(dead_code)]
async fn execute_node( async fn execute_node(
&self, &self,
node: &super::SkillNode, node: &super::SkillNode,
@@ -201,7 +208,7 @@ impl SkillGraphExecutor for DefaultExecutor {
let mut node_results: HashMap<String, NodeResult> = HashMap::new(); let mut node_results: HashMap<String, NodeResult> = HashMap::new();
let mut progress = OrchestrationProgress::new(&graph.id, graph.nodes.len()); let mut progress = OrchestrationProgress::new(&graph.id, graph.nodes.len());
// Execute parallel groups // Execute parallel groups sequentially, but nodes within each group in parallel
for group in &plan.parallel_groups { for group in &plan.parallel_groups {
if self.is_cancelled(&graph.id).await { if self.is_cancelled(&graph.id).await {
return Ok(OrchestrationResult { return Ok(OrchestrationResult {
@@ -213,40 +220,72 @@ impl SkillGraphExecutor for DefaultExecutor {
}); });
} }
// Execute nodes in parallel within the group progress.status = format!("Executing group with {} nodes", group.len());
progress_fn(progress.clone());
// Execute all nodes in the group concurrently using JoinSet
let mut join_set = tokio::task::JoinSet::new();
for node_id in group { for node_id in group {
if let Some(node) = graph.nodes.iter().find(|n| &n.id == node_id) { if let Some(node) = graph.nodes.iter().find(|n| &n.id == node_id) {
progress.current_node = Some(node_id.clone()); let node = node.clone();
progress_fn(progress.clone()); let node_id = node_id.clone();
let orch_ctx = orch_context.clone();
let skill_ctx = context.clone();
let registry = self.registry.clone();
let result = self.execute_node(node, &orch_context, context).await join_set.spawn(async move {
.unwrap_or_else(|e| NodeResult { let input = orch_ctx.resolve_node_input(&node);
node_id: node_id.clone(), let start = Instant::now();
success: false,
output: Value::Null, let result = registry.execute(&node.skill_id, &skill_ctx, input).await;
error: Some(e.to_string()), let nr = match result {
duration_ms: 0, Ok(sr) if sr.success => NodeResult {
retries: 0, node_id: node_id.clone(),
skipped: false, success: true,
}); output: sr.output,
node_results.insert(node_id.clone(), result); error: None,
duration_ms: start.elapsed().as_millis() as u64,
retries: 0,
skipped: false,
},
Ok(sr) => NodeResult {
node_id: node_id.clone(),
success: false,
output: Value::Null,
error: sr.error,
duration_ms: start.elapsed().as_millis() as u64,
retries: 0,
skipped: false,
},
Err(e) => NodeResult {
node_id: node_id.clone(),
success: false,
output: Value::Null,
error: Some(e.to_string()),
duration_ms: start.elapsed().as_millis() as u64,
retries: 0,
skipped: false,
},
};
ParallelNodeResult { node_id, result: nr }
});
} }
} }
// Update context with node outputs // Collect results as tasks complete
for node_id in group { while let Some(join_result) = join_set.join_next().await {
if let Some(result) = node_results.get(node_id) { match join_result {
if result.success { Ok(parallel_result) => {
orch_context.set_node_output(node_id, result.output.clone()); let ParallelNodeResult { node_id, result } = parallel_result;
progress.completed_nodes.push(node_id.clone()); if result.success {
} else { orch_context.set_node_output(&node_id, result.output.clone());
progress.failed_nodes.push(node_id.clone()); progress.completed_nodes.push(node_id.clone());
} else {
// Handle error based on strategy progress.failed_nodes.push(node_id.clone());
match graph.on_error { if matches!(graph.on_error, ErrorStrategy::Stop) {
ErrorStrategy::Stop => {
// Clone error before moving node_results
let error = result.error.clone(); let error = result.error.clone();
node_results.insert(node_id, result);
join_set.abort_all();
return Ok(OrchestrationResult { return Ok(OrchestrationResult {
success: false, success: false,
output: Value::Null, output: Value::Null,
@@ -255,27 +294,24 @@ impl SkillGraphExecutor for DefaultExecutor {
error, error,
}); });
} }
ErrorStrategy::Continue => {
// Continue to next group
}
ErrorStrategy::Retry => {
// Already handled in execute_node
}
} }
node_results.insert(node_id, result);
}
Err(e) => {
tracing::warn!("[Orchestration] Task panicked: {}", e);
} }
} }
} }
// Update progress // Update progress
progress.progress_percent = ((progress.completed_nodes.len() + progress.failed_nodes.len()) progress.progress_percent = ((progress.completed_nodes.len() + progress.failed_nodes.len())
* 100 / graph.nodes.len()) as u8; * 100 / graph.nodes.len().max(1)) as u8;
progress.status = format!("Completed group with {} nodes", group.len()); progress.status = format!("Completed group with {} nodes", group.len());
progress_fn(progress.clone()); progress_fn(progress.clone());
} }
// Build final output // Build final output
let output = orch_context.build_output(&graph.output_mapping); let output = orch_context.build_output(&graph.output_mapping);
let success = progress.failed_nodes.is_empty(); let success = progress.failed_nodes.is_empty();
Ok(OrchestrationResult { Ok(OrchestrationResult {

View File

@@ -13,6 +13,7 @@ pub mod chat;
pub mod hand; pub mod hand;
pub mod lifecycle; pub mod lifecycle;
pub mod mcp; pub mod mcp;
pub mod orchestration;
pub mod scheduled_task; pub mod scheduled_task;
pub mod skill; pub mod skill;
pub mod trigger; pub mod trigger;

View File

@@ -0,0 +1,273 @@
//! Skill orchestration Tauri commands
//!
//! Exposes the multi-skill orchestration engine to the frontend,
//! enabling parallel/serial/conditional execution of skill graphs.
use std::collections::HashMap;
use serde::{Deserialize, Serialize};
use serde_json::Value;
use tauri::State;
use super::KernelState;
// ============================================================================
// Request/Response Types
// ============================================================================
/// Orchestration execution request sent from the frontend.
///
/// Serialized with camelCase keys (e.g. `skillIds`, `agentId`).
#[derive(Debug, Clone, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct OrchestrationRequest {
    /// Skill IDs to orchestrate (used for auto-compose when `graph` is absent).
    pub skill_ids: Vec<String>,
    /// Optional pre-defined graph (overrides auto-compose).
    pub graph: Option<OrchestrationGraphInput>,
    /// Input data fed to the orchestration's entry nodes.
    pub inputs: HashMap<String, Value>,
    /// Agent the orchestration executes as.
    pub agent_id: String,
    /// Session the orchestration runs under.
    pub session_id: String,
}
/// Graph input for a pre-defined orchestration.
#[derive(Debug, Clone, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct OrchestrationGraphInput {
    /// Graph identifier.
    pub id: String,
    /// Display name.
    pub name: String,
    /// Optional human-readable description.
    #[serde(default)]
    pub description: String,
    /// Nodes (skill invocations) in the graph.
    pub nodes: Vec<NodeInput>,
    /// Data-flow edges between nodes (optional).
    #[serde(default)]
    pub edges: Vec<EdgeInput>,
    /// Error strategy name: "stop" (default), "continue" or "retry".
    #[serde(default)]
    pub on_error: Option<String>,
    /// Overall timeout in seconds (defaults to 300 on conversion).
    #[serde(default)]
    pub timeout_secs: Option<u64>,
}
/// Node input for an orchestration graph.
#[derive(Debug, Clone, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct NodeInput {
    /// Unique node id within the graph.
    pub id: String,
    /// Id of the skill this node executes.
    pub skill_id: String,
    /// Optional human-readable description.
    #[serde(default)]
    pub description: String,
    /// Mapping of this node's input fields to upstream values (optional).
    #[serde(default)]
    pub input_mappings: HashMap<String, String>,
    /// Optional condition expression gating execution — presumably evaluated
    /// by the orchestration engine; confirm syntax against zclaw-skills.
    #[serde(default)]
    pub when: Option<String>,
    /// Skip-on-error flag; converted with `unwrap_or(false)` — exact skip
    /// semantics are defined by the engine.
    #[serde(default)]
    pub skip_on_error: Option<bool>,
    /// Per-node timeout override in seconds (optional).
    #[serde(default)]
    pub timeout_secs: Option<u64>,
}
/// Edge input for an orchestration graph.
#[derive(Debug, Clone, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct EdgeInput {
    /// Source node id.
    pub from_node: String,
    /// Destination node id.
    pub to_node: String,
    /// Output-field to input-field mapping applied along the edge (optional).
    #[serde(default)]
    pub field_mapping: HashMap<String, String>,
    /// Optional condition expression for this edge.
    #[serde(default)]
    pub condition: Option<String>,
}
/// Orchestration execution result returned to the frontend.
#[derive(Debug, Clone, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct OrchestrationResponse {
    /// True when no node failed.
    pub success: bool,
    /// Final graph output (built from the graph's output mapping).
    pub output: Value,
    /// Total number of nodes that produced a result (completed + failed).
    pub node_count: usize,
    /// Count of nodes that completed successfully.
    pub completed_nodes: usize,
    /// Count of nodes that failed.
    pub failed_nodes: usize,
    /// Wall-clock duration of the whole orchestration in milliseconds.
    pub duration_ms: u64,
    /// Top-level error message, if the run failed.
    pub error: Option<String>,
    /// Per-node results keyed by node id.
    pub node_results: HashMap<String, NodeResultResponse>,
}
/// Single node's execution result, returned to the frontend.
#[derive(Debug, Clone, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct NodeResultResponse {
    /// Whether the node's skill executed successfully.
    pub success: bool,
    /// The node's output value (`null` on failure).
    pub output: Value,
    /// Error message when the node failed.
    pub error: Option<String>,
    /// Node execution duration in milliseconds.
    pub duration_ms: u64,
    /// Number of retries performed.
    pub retries: u32,
    /// Whether the node was skipped rather than executed.
    pub skipped: bool,
}
/// Dry-run validation result for the frontend.
#[derive(Debug, Clone, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct ValidationResponse {
    /// True when `errors` is empty.
    pub valid: bool,
    /// All validation errors found in the graph.
    pub errors: Vec<ValidationErrorInfo>,
}
/// One validation error, mirrored from the engine's `ValidationError`.
#[derive(Debug, Clone, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct ValidationErrorInfo {
    /// Machine-readable error code.
    pub code: String,
    /// Human-readable error message.
    pub message: String,
    /// Where in the graph the error occurred (e.g. a node id), if known.
    pub location: Option<String>,
}
// ============================================================================
// Type Conversions
// ============================================================================
impl TryFrom<OrchestrationGraphInput> for zclaw_skills::orchestration::SkillGraph {
    type Error = String;

    /// Convert the frontend graph description into the engine's `SkillGraph`.
    ///
    /// # Errors
    /// Fails when `on_error` names an unknown error strategy. (Previously any
    /// unrecognized value — "Continue", "halt", a typo — was silently coerced
    /// to `Stop`, hiding frontend mistakes even though the conversion is
    /// already fallible.)
    fn try_from(input: OrchestrationGraphInput) -> Result<Self, Self::Error> {
        // Retry policy is not exposed to the frontend yet, so it is always
        // `None`; `skip_on_error` defaults to false when omitted.
        let nodes: Vec<zclaw_skills::orchestration::SkillNode> = input
            .nodes
            .into_iter()
            .map(|n| zclaw_skills::orchestration::SkillNode {
                id: n.id,
                skill_id: zclaw_types::SkillId::new(&n.skill_id),
                description: n.description,
                input_mappings: n.input_mappings,
                retry: None,
                timeout_secs: n.timeout_secs,
                when: n.when,
                skip_on_error: n.skip_on_error.unwrap_or(false),
            })
            .collect();

        let edges: Vec<zclaw_skills::orchestration::SkillEdge> = input
            .edges
            .into_iter()
            .map(|e| zclaw_skills::orchestration::SkillEdge {
                from_node: e.from_node,
                to_node: e.to_node,
                field_mapping: e.field_mapping,
                condition: e.condition,
            })
            .collect();

        // Error strategy: case-insensitive, absent means Stop; unknown
        // values are rejected instead of silently defaulting to Stop.
        let normalized = input.on_error.as_deref().map(str::to_ascii_lowercase);
        let on_error = match normalized.as_deref() {
            None | Some("stop") => zclaw_skills::orchestration::ErrorStrategy::Stop,
            Some("continue") => zclaw_skills::orchestration::ErrorStrategy::Continue,
            Some("retry") => zclaw_skills::orchestration::ErrorStrategy::Retry,
            Some(other) => {
                return Err(format!(
                    "Unknown onError strategy '{}' (expected 'stop', 'continue' or 'retry')",
                    other
                ))
            }
        };

        Ok(zclaw_skills::orchestration::SkillGraph {
            id: input.id,
            name: input.name,
            description: input.description,
            nodes,
            edges,
            // Graph-level input schema and output mapping are not
            // configurable from the frontend yet.
            input_schema: None,
            output_mapping: HashMap::new(),
            on_error,
            timeout_secs: input.timeout_secs.unwrap_or(300),
        })
    }
}
impl From<zclaw_skills::orchestration::OrchestrationResult> for OrchestrationResponse {
fn from(result: zclaw_skills::orchestration::OrchestrationResult) -> Self {
let completed = result.node_results.values().filter(|r| r.success).count();
let failed = result.node_results.values().filter(|r| !r.success).count();
let node_results = result.node_results.into_iter().map(|(id, nr)| {
(id, NodeResultResponse {
success: nr.success,
output: nr.output,
error: nr.error,
duration_ms: nr.duration_ms,
retries: nr.retries,
skipped: nr.skipped,
})
}).collect();
Self {
success: result.success,
output: result.output,
node_count: completed + failed,
completed_nodes: completed,
failed_nodes: failed,
duration_ms: result.duration_ms,
error: result.error,
node_results,
}
}
}
// ============================================================================
// Tauri Commands
// ============================================================================
/// Execute a skill orchestration.
///
/// Either auto-composes a graph from `skill_ids`, or uses a pre-defined
/// graph. Executes with true parallel execution within each dependency level.
#[tauri::command]
pub async fn orchestration_execute(
    state: State<'_, KernelState>,
    request: OrchestrationRequest,
) -> Result<OrchestrationResponse, String> {
    // NOTE(review): the kernel lock is held for the entire orchestration run —
    // confirm long-running graphs cannot starve other Tauri commands.
    let kernel_lock = state.lock().await;
    let kernel = kernel_lock
        .as_ref()
        .ok_or_else(|| "Kernel not initialized".to_string())?;

    // Prefer an explicit graph; otherwise auto-compose from the skill ids.
    let graph = match request.graph {
        Some(graph_input) => graph_input.try_into()?,
        None if request.skill_ids.is_empty() => {
            return Err("Must provide either skill_ids or graph".to_string());
        }
        None => {
            let skill_ids: Vec<zclaw_types::SkillId> = request
                .skill_ids
                .iter()
                .map(|s| zclaw_types::SkillId::new(s))
                .collect();
            kernel
                .auto_compose_skills(&skill_ids)
                .await
                .map_err(|e| format!("Auto-compose failed: {}", e))?
        }
    };

    // Skill context: the graph-level timeout doubles as the per-skill budget.
    let context = zclaw_skills::SkillContext {
        agent_id: request.agent_id,
        session_id: request.session_id,
        working_dir: None,
        env: HashMap::new(),
        timeout_secs: graph.timeout_secs,
        network_allowed: true,
        file_access_allowed: true,
        llm: None,
    };

    kernel
        .execute_orchestration(&graph, request.inputs, &context)
        .await
        .map(OrchestrationResponse::from)
        .map_err(|e| format!("Orchestration failed: {}", e))
}
/// Validate an orchestration graph without executing it (dry run).
#[tauri::command]
pub async fn orchestration_validate(
    state: State<'_, KernelState>,
    graph: OrchestrationGraphInput,
) -> Result<ValidationResponse, String> {
    let kernel_lock = state.lock().await;
    let kernel = kernel_lock
        .as_ref()
        .ok_or_else(|| "Kernel not initialized".to_string())?;

    // Convert the frontend DTO, then run the engine's graph validation.
    let skill_graph: zclaw_skills::orchestration::SkillGraph = graph.try_into()?;
    let errors = kernel.validate_orchestration(&skill_graph).await;

    Ok(ValidationResponse {
        valid: errors.is_empty(),
        errors: errors
            .into_iter()
            .map(|e| ValidationErrorInfo {
                code: e.code,
                message: e.message,
                location: e.location,
            })
            .collect(),
    })
}

View File

@@ -146,6 +146,9 @@ pub fn run() {
kernel_commands::skill::skill_create, kernel_commands::skill::skill_create,
kernel_commands::skill::skill_update, kernel_commands::skill::skill_update,
kernel_commands::skill::skill_delete, kernel_commands::skill::skill_delete,
// Orchestration commands (multi-skill graphs)
kernel_commands::orchestration::orchestration_execute,
kernel_commands::orchestration::orchestration_validate,
// Hands commands (autonomous capabilities) // Hands commands (autonomous capabilities)
kernel_commands::hand::hand_list, kernel_commands::hand::hand_list,
kernel_commands::hand::hand_execute, kernel_commands::hand::hand_execute,