From 37997a204c155eee895c2a0e2afc5e7c4bcab5f5 Mon Sep 17 00:00:00 2001 From: phact Date: Tue, 24 Jun 2025 08:54:31 -0400 Subject: [PATCH 01/14] take 1 --- .gitignore | 4 +- crates/stepflow-analysis/src/tracker.rs | 10 + crates/stepflow-builtins/src/eval.rs | 10 + crates/stepflow-core/src/flow_result.rs | 22 + crates/stepflow-core/src/workflow/step.rs | 6 + crates/stepflow-execution/src/executor.rs | 99 +- .../stepflow-execution/src/value_resolver.rs | 15 + .../src/workflow_executor.rs | 384 ++++++- crates/stepflow-main/src/repl.rs | 9 + crates/stepflow-plugin/src/context.rs | 14 + crates/stepflow-plugin/src/error.rs | 8 + crates/stepflow-plugin/src/lib.rs | 2 +- crates/stepflow-protocol/src/blob_handlers.rs | 57 + .../stepflow-protocol/src/incoming_handler.rs | 3 +- crates/stepflow-protocol/src/lib.rs | 2 +- crates/stepflow-server/src/api/debug.rs | 1 + crates/stepflow-server/src/api/runs.rs | 13 + examples/audio-streaming-pipeline.yaml | 82 ++ examples/audio_input.json | 12 + examples/stepflow-config.yml | 7 + examples/test_audio_pipeline.sh | 94 ++ sdks/python/pyproject.toml | 3 + .../src/stepflow_sdk/audio_components.py | 1016 +++++++++++++++++ sdks/python/src/stepflow_sdk/main.py | 6 + sdks/python/src/stepflow_sdk/server.py | 68 +- sdks/python/uv.lock | 92 ++ 26 files changed, 1970 insertions(+), 69 deletions(-) create mode 100644 examples/audio-streaming-pipeline.yaml create mode 100644 examples/audio_input.json create mode 100644 examples/stepflow-config.yml create mode 100755 examples/test_audio_pipeline.sh create mode 100644 sdks/python/src/stepflow_sdk/audio_components.py diff --git a/.gitignore b/.gitignore index 7f5e57bb..55bfeb44 100644 --- a/.gitignore +++ b/.gitignore @@ -47,4 +47,6 @@ Thumbs.db # Project specific target -TODO.md \ No newline at end of file +TODO.md + +*.wav diff --git a/crates/stepflow-analysis/src/tracker.rs b/crates/stepflow-analysis/src/tracker.rs index d0a3aa87..81bd307f 100644 --- a/crates/stepflow-analysis/src/tracker.rs +++ b/crates/stepflow-analysis/src/tracker.rs @@ -87,6 +87,16 @@ pub struct DependencyTracker { completed: BitSet, } +impl Clone for DependencyTracker { + fn clone(&self) -> Self { + Self { + dependencies: self.dependencies.clone(), + blocking: self.blocking.clone(), + completed: self.completed.clone(), + } + } +} + impl DependencyTracker { pub fn new(dependencies: Arc) -> Self { let blocking = dependencies diff --git a/crates/stepflow-builtins/src/eval.rs b/crates/stepflow-builtins/src/eval.rs index 9a4b10b5..89c925d5 100644 --- a/crates/stepflow-builtins/src/eval.rs +++ b/crates/stepflow-builtins/src/eval.rs @@ -84,6 +84,16 @@ impl BuiltinComponent for EvalComponent { let result_value = match nested_result { FlowResult::Success { result } => result.as_ref().clone(), FlowResult::Skipped => serde_json::Value::Null, + FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { + // For streaming results, return the metadata and chunk info + serde_json::json!({ + "stream_id": stream_id, + "metadata": metadata.as_ref(), + "chunk": chunk, + "chunk_index": chunk_index, + "is_final": is_final + }) + } FlowResult::Failed { error } => { // Propagate the failure from the nested workflow return Ok(FlowResult::Failed { error }); diff --git a/crates/stepflow-core/src/flow_result.rs b/crates/stepflow-core/src/flow_result.rs index 55625d56..5c6af92d 100644 --- a/crates/stepflow-core/src/flow_result.rs +++ b/crates/stepflow-core/src/flow_result.rs @@ -49,6 +49,19 @@ impl FlowError { pub enum FlowResult { /// The step execution 
was successful. Success { result: ValueRef }, + /// The step is streaming data. + Streaming { + /// Stream identifier + stream_id: String, + /// Metadata about the stream + metadata: ValueRef, + /// Base64 encoded chunk data + chunk: String, + /// Chunk index + chunk_index: usize, + /// Whether this is the final chunk + is_final: bool, + }, /// The step was skipped. Skipped, /// The step failed with the given error. @@ -70,6 +83,15 @@ impl FlowResult { } } + pub fn streaming(&self) -> Option<(String, ValueRef, String, usize, bool)> { + match self { + Self::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { + Some((stream_id.clone(), metadata.clone(), chunk.clone(), *chunk_index, *is_final)) + } + _ => None, + } + } + pub fn skipped(&self) -> bool { matches!(self, Self::Skipped) } diff --git a/crates/stepflow-core/src/workflow/step.rs b/crates/stepflow-core/src/workflow/step.rs index 31da8829..a529ad7e 100644 --- a/crates/stepflow-core/src/workflow/step.rs +++ b/crates/stepflow-core/src/workflow/step.rs @@ -28,6 +28,10 @@ pub struct Step { /// Arguments to pass to the component for this step #[serde(default, skip_serializing_if = "ValueRef::is_null")] pub input: ValueRef, + + /// Whether this step is a streaming step (doesn't persist results) + #[serde(default, skip_serializing_if = "std::ops::Not::not")] + pub streaming: bool, } #[derive( @@ -134,6 +138,7 @@ mod tests { default_value: Some(ValueRef::from("fallback")), }, input: serde_json::Value::Null.into(), + streaming: false, }; let yaml = serde_yaml_ng::to_string(&step).unwrap(); @@ -152,6 +157,7 @@ mod tests { skip_if: None, on_error: ErrorAction::Fail, input: serde_json::Value::Null.into(), + streaming: false, }; let yaml = serde_yaml_ng::to_string(&step).unwrap(); diff --git a/crates/stepflow-execution/src/executor.rs b/crates/stepflow-execution/src/executor.rs index 7610bf93..a28ec5ed 100644 --- a/crates/stepflow-execution/src/executor.rs +++ b/crates/stepflow-execution/src/executor.rs @@ -150,6 +150,31 @@ impl StepFlowExecutor { Ok(workflow_executor) } + + /// Get a workflow executor for debug sessions + pub async fn get_workflow_executor( + &self, + execution_id: Uuid, + ) -> Result> { + let debug_sessions = self.debug_sessions.read().await; + Ok(debug_sessions.get(&execution_id).cloned()) + } + + /// Get a mutable workflow executor for debug sessions + pub async fn get_workflow_executor_mut( + &self, + execution_id: Uuid, + ) -> Result> { + let mut debug_sessions = self.debug_sessions.write().await; + Ok(debug_sessions.get_mut(&execution_id).cloned()) + } + + /// Get the flow for a specific execution (for streaming pipeline coordinator) + pub fn flow(&self) -> Option> { + // This is a placeholder - in a real implementation, we'd need to store flows + // For now, return None since we don't have access to the flow + None + } } impl Context for StepFlowExecutor { @@ -237,38 +262,18 @@ impl Context for StepFlowExecutor { &self, execution_id: Uuid, ) -> BoxFuture<'_, stepflow_plugin::Result> { + let pending = self.pending.clone(); + async move { - // Remove and get the receiver for this execution - let receiver = { - let pending = self.pending.read().await; - pending.get(&execution_id).cloned() - }; - - match receiver { - Some(rx) => { - match rx.await { - Ok(result) => Ok(result), - Err(_) => { - // The sender was dropped, indicating the execution was cancelled or failed - Ok(FlowResult::Failed { - error: stepflow_core::FlowError::new( - 410, - "Nested flow execution was cancelled", - ), - }) - } - } - } - None => 
{ - // Execution ID not found - Ok(FlowResult::Failed { - error: stepflow_core::FlowError::new( - 404, - format!("No execution found for ID: {}", execution_id), - ), - }) - } - } + let pending = pending.read().await; + let future = pending + .get(&execution_id) + .ok_or_else(|| stepflow_plugin::PluginError::new("Execution not found")) + .change_context(stepflow_plugin::PluginError::new("Execution not found"))? + .clone(); + + future.await.map_err(|_| stepflow_plugin::PluginError::new("Execution failed")) + .change_context(stepflow_plugin::PluginError::new("Execution failed")) } .boxed() } @@ -276,6 +281,38 @@ impl Context for StepFlowExecutor { fn state_store(&self) -> &Arc { &self.state_store } + + fn executor(&self) -> Option> { + Some(Arc::new(StepFlowExecutorWrapper(self.self_weak.clone()))) + } +} + +/// Wrapper to provide Executor trait implementation for StepFlowExecutor +struct StepFlowExecutorWrapper(std::sync::Weak); + +impl stepflow_plugin::Executor for StepFlowExecutorWrapper { + fn get_workflow_executor( + &self, + execution_id: Uuid, + ) -> BoxFuture<'_, stepflow_plugin::Result>>> { + let weak = self.0.clone(); + + async move { + if let Some(executor) = weak.upgrade() { + match executor.get_workflow_executor(execution_id).await { + Ok(Some(workflow_executor)) => { + Ok(Some(Box::new(workflow_executor) as Box)) + } + Ok(None) => Ok(None), + Err(e) => Err(stepflow_plugin::PluginError::new(format!("Failed to get workflow executor: {:?}", e))) + .change_context(stepflow_plugin::PluginError::new("Failed to get workflow executor")), + } + } else { + Ok(None) + } + } + .boxed() + } } #[cfg(test)] diff --git a/crates/stepflow-execution/src/value_resolver.rs b/crates/stepflow-execution/src/value_resolver.rs index c505e1c5..cdb804f9 100644 --- a/crates/stepflow-execution/src/value_resolver.rs +++ b/crates/stepflow-execution/src/value_resolver.rs @@ -10,6 +10,7 @@ use uuid::Uuid; use crate::{ExecutionError, Result}; /// Value resolver for handling expression and JSON value resolution +#[derive(Clone)] pub struct ValueResolver { /// Execution ID of the workflow we are resolving for. /// @@ -97,6 +98,10 @@ impl ValueResolver { // NOTE: Skip actions are applied after path resolution. 
match path_result { FlowResult::Success { result } => Ok(FlowResult::Success { result }), + FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { + // For streaming results, we can't apply skip actions, so just pass through + Ok(FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final }) + } FlowResult::Skipped => { match expr.on_skip() { Some(SkipAction::UseDefault { default_value }) => { @@ -151,6 +156,11 @@ impl ValueResolver { FlowResult::Success { result } => { result_map.insert(k.clone(), result.as_ref().clone()); } + FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { + // For streaming results in objects, we can't handle them properly + // Return the streaming result as-is + return Ok(FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final }); + } FlowResult::Skipped => { return Ok(FlowResult::Skipped); } @@ -171,6 +181,11 @@ impl ValueResolver { FlowResult::Success { result } => { result_array.push(result.as_ref().clone()); } + FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { + // For streaming results in arrays, we can't handle them properly + // Return the streaming result as-is + return Ok(FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final }); + } FlowResult::Skipped => { return Ok(FlowResult::Skipped); } diff --git a/crates/stepflow-execution/src/workflow_executor.rs b/crates/stepflow-execution/src/workflow_executor.rs index a3d7d628..18633665 100644 --- a/crates/stepflow-execution/src/workflow_executor.rs +++ b/crates/stepflow-execution/src/workflow_executor.rs @@ -12,6 +12,7 @@ use stepflow_core::{ use stepflow_plugin::{DynPlugin, ExecutionContext, Plugin as _}; use stepflow_state::{StateStore, StepResult}; use uuid::Uuid; +use tokio::sync::{mpsc, oneshot}; use crate::{ExecutionError, Result, StepFlowExecutor, value_resolver::ValueResolver}; @@ -40,6 +41,7 @@ pub(crate) async fn execute_workflow( /// /// This serves as the core execution engine that can be used directly for /// run-to-completion execution, or controlled step-by-step by the debug session. +#[derive(Clone)] pub struct WorkflowExecutor { /// Dependency tracker for determining runnable steps tracker: stepflow_analysis::DependencyTracker, @@ -53,6 +55,8 @@ pub struct WorkflowExecutor { flow: Arc, /// Execution context for this session context: ExecutionContext, + /// Optional streaming pipeline coordinator + streaming_coordinator: Option>>, } impl WorkflowExecutor { @@ -86,6 +90,7 @@ impl WorkflowExecutor { executor, flow, context, + streaming_coordinator: None, }) } @@ -369,6 +374,7 @@ impl WorkflowExecutor { FlowResult::Success { .. } => CoreStepStatus::Completed, FlowResult::Skipped => CoreStepStatus::Skipped, FlowResult::Failed { .. } => CoreStepStatus::Failed, + FlowResult::Streaming { .. } => CoreStepStatus::Running, // Streaming steps are considered running }, Err(_) => CoreStepStatus::Blocked, } @@ -421,24 +427,19 @@ impl WorkflowExecutor { // Resolve step inputs let step_input = match self.resolver.resolve(&step.input).await? 
{ FlowResult::Success { result } => result, + FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { + // For streaming steps, we can handle streaming inputs + // For now, just return the metadata as the input + metadata + } FlowResult::Skipped => { - // Step inputs contain skipped values - skip this step - let result = FlowResult::Skipped; - self.record_step_completion(step_index, &result).await?; - return Ok(StepExecutionResult::new( - step_index, - step_id, - component_string, - result, - )); + return Err(ExecutionError::StepNotRunnable { + step: step_id.clone(), + } + .into()); } FlowResult::Failed { error } => { - return Ok(StepExecutionResult::new( - step_index, - step_id, - component_string, - FlowResult::Failed { error }, - )); + return Err(ExecutionError::StepFailed { step: step_id }.into()); } }; @@ -446,8 +447,14 @@ impl WorkflowExecutor { let plugin = self.executor.get_plugin(&step.component).await?; let result = execute_step_async(plugin, step, step_input, self.context.clone()).await?; - // Record the result - self.record_step_completion(step_index, &result).await?; + // For streaming steps, don't record in state store + if step.streaming { + // Update dependency tracker but don't persist + self.tracker.complete_step(step_index); + } else { + // Record the result for non-streaming steps + self.record_step_completion(step_index, &result).await?; + } Ok(StepExecutionResult::new( step_index, @@ -502,6 +509,7 @@ impl WorkflowExecutor { FlowResult::Success { result } => Ok(result.is_truthy()), FlowResult::Skipped => Ok(false), // Don't skip if condition references skipped values FlowResult::Failed { .. } => Ok(false), // Don't skip if condition evaluation failed + FlowResult::Streaming { .. } => Ok(false), // Don't skip if condition references streaming values } } @@ -553,6 +561,14 @@ impl WorkflowExecutor { .union_with(&self.skip_step(&step_id, step_index).await?); continue; } + Ok(FlowResult::Streaming { .. }) => { + // Step inputs contain streaming values - this is not supported for regular steps + tracing::error!( + "Step {} has streaming inputs which is not supported for non-streaming steps", + step_id + ); + return Err(ExecutionError::StepFailed { step: step_id }.into()); + } Ok(FlowResult::Failed { error }) => { tracing::error!( "Failed to resolve inputs for step {} - input resolution failed: {:?}", @@ -637,6 +653,218 @@ impl WorkflowExecutor { Ok(()) } + + /// Execute a streaming step continuously. + /// This method runs the step in a loop, processing chunks as they arrive. 
+ pub async fn execute_streaming_step( + &mut self, + step_index: usize, + ) -> Result<()> { + let step = &self.flow.steps[step_index]; + let step_id = step.id.clone(); + + // Check if the step is runnable + if !self.tracker.unblocked_steps().contains(step_index) { + return Err(ExecutionError::StepNotRunnable { + step: step.id.clone(), + } + .into()); + } + + // Check if this is actually a streaming step + if !step.streaming { + return Err(ExecutionError::StepNotRunnable { + step: step.id.clone(), + } + .into()); + } + + // Check if this is part of a streaming pipeline + if self.is_streaming_pipeline_step(step_index) { + return self.execute_streaming_pipeline_step(step_index).await; + } + + // Fallback to individual streaming step execution + self.execute_individual_streaming_step(step_index).await + } + + /// Check if a step is part of a streaming pipeline (has streaming inputs/outputs) + fn is_streaming_pipeline_step(&self, step_index: usize) -> bool { + let step = &self.flow.steps[step_index]; + + // Check if this step has streaming inputs from other streaming steps + for (other_index, other_step) in self.flow.steps.iter().enumerate() { + if other_index != step_index && other_step.streaming { + // Check if this step references the other streaming step + if self.step_references_other_step(step, other_step) { + return true; + } + } + } + + false + } + + /// Check if a step references another step in its inputs + fn step_references_other_step(&self, step: &stepflow_core::workflow::Step, other_step: &stepflow_core::workflow::Step) -> bool { + // Simple check: look for step references in the input + let input_str = serde_json::to_string(&step.input).unwrap_or_default(); + input_str.contains(&format!("step: {}", other_step.id)) + } + + /// Execute a step that's part of a streaming pipeline + async fn execute_streaming_pipeline_step(&mut self, step_index: usize) -> Result<()> { + let step = &self.flow.steps[step_index]; + let step_id = step.id.clone(); + + tracing::info!("Executing streaming pipeline step: {}", step_id); + + // Find all streaming steps in the pipeline + let pipeline_steps = self.find_streaming_pipeline_steps(step_index); + + // Create a streaming coordinator and store it + let coordinator = std::sync::Arc::new(tokio::sync::Mutex::new(StreamingPipelineCoordinator::new( + self.executor.clone(), + pipeline_steps, + self.context.clone(), + ))); + self.streaming_coordinator = Some(coordinator.clone()); + + // Execute the entire pipeline + coordinator.lock().await.execute_pipeline().await?; + + // Update dependency tracker + self.tracker.complete_step(step_index); + + Ok(()) + } + + /// Find all steps that are part of the same streaming pipeline + fn find_streaming_pipeline_steps(&self, start_step_index: usize) -> Vec { + let mut pipeline_steps = vec![start_step_index]; + let mut to_check = vec![start_step_index]; + let mut checked = std::collections::HashSet::new(); + + while let Some(step_index) = to_check.pop() { + if checked.contains(&step_index) { + continue; + } + checked.insert(step_index); + + let step = &self.flow.steps[step_index]; + + // Find steps that this step depends on (streaming inputs) + for (other_index, other_step) in self.flow.steps.iter().enumerate() { + if other_step.streaming && self.step_references_other_step(step, other_step) { + if !pipeline_steps.contains(&other_index) { + pipeline_steps.push(other_index); + to_check.push(other_index); + } + } + } + + // Find steps that depend on this step (streaming outputs) + for (other_index, other_step) in 
self.flow.steps.iter().enumerate() { + if other_step.streaming && self.step_references_other_step(other_step, step) { + if !pipeline_steps.contains(&other_index) { + pipeline_steps.push(other_index); + to_check.push(other_index); + } + } + } + } + + pipeline_steps.sort(); + pipeline_steps + } + + /// Execute an individual streaming step (fallback) + async fn execute_individual_streaming_step(&mut self, step_index: usize) -> Result<()> { + let step = &self.flow.steps[step_index]; + let step_id = step.id.clone(); + + // Resolve step inputs + let step_input = match self.resolver.resolve(&step.input).await? { + FlowResult::Success { result } => result, + FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { + // For streaming steps, we can handle streaming inputs + // For now, just return the metadata as the input + metadata + } + FlowResult::Skipped => { + return Err(ExecutionError::StepNotRunnable { + step: step_id.clone(), + } + .into()); + } + FlowResult::Failed { error } => { + return Err(ExecutionError::StepFailed { step: step_id }.into()); + } + }; + + // Get plugin + let plugin = self.executor.get_plugin(&step.component).await?; + + // Execute streaming step in a loop + let mut chunk_index = 0; + loop { + let result = execute_step_async(plugin.clone(), step, step_input.clone(), self.context.clone()).await?; + + match result { + FlowResult::Streaming { stream_id, metadata, chunk, chunk_index: _, is_final } => { + // Process the streaming chunk + tracing::debug!( + "Streaming step {} chunk {}: stream_id={}, is_final={}", + step_id, chunk_index, stream_id, is_final + ); + + // Here you could emit the chunk to downstream steps or external consumers + // For now, we just log it + + chunk_index += 1; + + if is_final { + break; + } + } + FlowResult::Success { result } => { + // Non-streaming result, treat as final + tracing::debug!("Streaming step {} completed with success", step_id); + break; + } + FlowResult::Failed { error } => { + tracing::error!("Streaming step {} failed: {:?}", step_id, error); + return Err(ExecutionError::StepFailed { step: step_id }.into()); + } + FlowResult::Skipped => { + tracing::debug!("Streaming step {} skipped", step_id); + break; + } + } + } + + // Update dependency tracker for streaming step + self.tracker.complete_step(step_index); + + Ok(()) + } + + /// Route a streaming chunk to the appropriate streaming pipeline + pub async fn route_streaming_chunk(&mut self, chunk: serde_json::Value) -> Result<()> { + tracing::debug!("Routing streaming chunk to workflow executor"); + + // For now, we'll just log the chunk + // In a full implementation, this would route the chunk to the appropriate streaming step + tracing::info!("Received streaming chunk: {:?}", chunk); + + // TODO: Implement proper chunk routing to streaming steps + // This would involve: + // 1. Finding which streaming step should receive this chunk + // 2. Sending it through the appropriate channel + // 3. Triggering the step to process the chunk + + Ok(()) + } } /// Execute a single step asynchronously. 
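The route_streaming_chunk TODO above describes the missing dispatch: find the streaming step that consumes the chunk, send it over that step's channel, and let the step process it. Purely as an illustration of the shape this could take (the StreamChunk struct, route_chunk function, and routes map below are hypothetical stand-ins, not part of this patch), here is a minimal sketch assuming tokio mpsc channels like the coordinator's step_connections:

// Hypothetical sketch, not part of the patch: one possible dispatch once the
// routing TODO is implemented. Field names mirror FlowResult::Streaming.
use std::collections::HashMap;
use tokio::sync::mpsc;

#[derive(Clone, Debug)]
struct StreamChunk {
    stream_id: String,
    chunk: String,      // base64-encoded PCM data, as elsewhere in this patch
    chunk_index: usize,
    is_final: bool,
}

/// Looks up which step indices consume a given stream_id, then forwards the
/// chunk on each step's channel (analogous to step_connections in
/// StreamingPipelineCoordinator).
async fn route_chunk(
    routes: &HashMap<String, Vec<usize>>,
    senders: &HashMap<usize, mpsc::Sender<StreamChunk>>,
    chunk: StreamChunk,
) {
    if let Some(step_indices) = routes.get(&chunk.stream_id) {
        for idx in step_indices {
            if let Some(tx) = senders.get(idx) {
                // Awaiting send applies backpressure when the bounded
                // per-step buffer (100 chunks in the coordinator) is full.
                let _ = tx.send(chunk.clone()).await;
            }
        }
    }
}
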
@@ -732,6 +960,128 @@ pub struct StepInspection { pub state: CoreStepStatus, } +/// Coordinates streaming execution between multiple steps in a pipeline +struct StreamingPipelineCoordinator { + executor: Arc, + pipeline_steps: Vec, + context: ExecutionContext, + step_connections: std::collections::HashMap>, + step_receivers: std::collections::HashMap>, +} + +impl StreamingPipelineCoordinator { + fn new( + executor: Arc, + pipeline_steps: Vec, + context: ExecutionContext, + ) -> Self { + let mut step_connections = std::collections::HashMap::new(); + let mut step_receivers = std::collections::HashMap::new(); + + // Create channels for each step + for &step_index in &pipeline_steps { + let (tx, rx) = tokio::sync::mpsc::channel(100); // Buffer 100 chunks + step_connections.insert(step_index, tx); + step_receivers.insert(step_index, rx); + } + + Self { + executor, + pipeline_steps, + context, + step_connections, + step_receivers, + } + } + + async fn execute_pipeline(&mut self) -> Result<()> { + // For now, we'll just log that we're executing a streaming pipeline + // In a full implementation, this would coordinate all the streaming steps + tracing::info!("Executing streaming pipeline with {} steps", self.pipeline_steps.len()); + + // TODO: Implement full streaming pipeline coordination + // This would involve: + // 1. Starting all streaming steps in parallel + // 2. Setting up channels between steps + // 3. Routing chunks between steps + // 4. Handling backpressure and flow control + + Ok(()) + } + + fn get_downstream_senders(&self, step_index: usize) -> Vec> { + let mut senders = Vec::new(); + + for &other_step_index in &self.pipeline_steps { + if other_step_index != step_index { + if let Some(sender) = self.step_connections.get(&other_step_index) { + senders.push(sender.clone()); + } + } + } + + senders + } + + async fn run_streaming_step( + executor: Arc, + step: &stepflow_core::workflow::Step, + step_input: stepflow_core::workflow::ValueRef, + context: ExecutionContext, + mut receiver: tokio::sync::mpsc::Receiver, + downstream_senders: Vec>, + ) -> Result<()> { + let step_id = step.id.clone(); + let plugin = executor.get_plugin(&step.component).await?; + + tracing::info!("Starting streaming step: {}", step_id); + + // Execute the step to get initial result + let result = execute_step_async(plugin, step, step_input, context).await?; + + match result { + FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { + // Send the chunk to downstream steps + for sender in &downstream_senders { + let _ = sender.send(FlowResult::Streaming { + stream_id: stream_id.clone(), + metadata: metadata.clone(), + chunk: chunk.clone(), + chunk_index, + is_final, + }).await; + } + + // Continue processing if not final + if !is_final { + // Wait for input from upstream steps + while let Some(input_chunk) = receiver.recv().await { + // Process the input chunk and continue streaming + // This is where you'd call the step again with the new input + tracing::debug!("Step {} received chunk, continuing stream", step_id); + + // For now, just continue the loop + // In a full implementation, you'd call the step again + break; + } + } + } + FlowResult::Success { result } => { + tracing::info!("Streaming step {} completed with success", step_id); + } + FlowResult::Failed { error } => { + tracing::error!("Streaming step {} failed: {:?}", step_id, error); + return Err(ExecutionError::StepFailed { step: step_id }.into()); + } + FlowResult::Skipped => { + tracing::info!("Streaming step {} skipped", 
step_id); + } + } + + Ok(()) + } +} + #[cfg(test)] mod tests { use super::*; diff --git a/crates/stepflow-main/src/repl.rs b/crates/stepflow-main/src/repl.rs index 6332d93f..e1485f0b 100644 --- a/crates/stepflow-main/src/repl.rs +++ b/crates/stepflow-main/src/repl.rs @@ -674,6 +674,7 @@ async fn handle_completed_command(state: &ReplState) -> Result<()> { stepflow_core::FlowResult::Success { .. } => "SUCCESS", stepflow_core::FlowResult::Skipped => "SKIPPED", stepflow_core::FlowResult::Failed { .. } => "FAILED", + stepflow_core::FlowResult::Streaming { .. } => "RUNNING", }; println!( " [{}] {} ({}): {}", @@ -755,6 +756,14 @@ fn print_flow_result(result: &stepflow_core::FlowResult) -> Result<()> { stepflow_core::FlowResult::Failed { error } => { println!("Result: FAILED - {}", error); } + stepflow_core::FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { + println!("Result: STREAMING"); + println!(" Stream ID: {}", stream_id); + println!(" Metadata: {}", serde_json::to_string_pretty(metadata).unwrap_or_else(|_| "".to_string())); + println!(" Chunk: {}... ({} bytes base64)", &chunk[..chunk.len().min(32)], chunk.len()); + println!(" Chunk Index: {}", chunk_index); + println!(" Final: {}", is_final); + } } Ok(()) } diff --git a/crates/stepflow-plugin/src/context.rs b/crates/stepflow-plugin/src/context.rs index 5a9e0b9f..4e55b56d 100644 --- a/crates/stepflow-plugin/src/context.rs +++ b/crates/stepflow-plugin/src/context.rs @@ -40,6 +40,20 @@ pub trait Context: Send + Sync { /// Get the state store for this executor. fn state_store(&self) -> &Arc; + + /// Get a reference to the executor for advanced operations. + fn executor(&self) -> Option> { + None + } +} + +/// Trait for executor operations that require access to the StepFlowExecutor +pub trait Executor: Send + Sync { + /// Get a workflow executor for debug sessions + fn get_workflow_executor( + &self, + execution_id: Uuid, + ) -> BoxFuture<'_, crate::Result>>>; } /// Execution context that combines a Context with an execution ID. diff --git a/crates/stepflow-plugin/src/error.rs b/crates/stepflow-plugin/src/error.rs index a2343fc5..0a1b647a 100644 --- a/crates/stepflow-plugin/src/error.rs +++ b/crates/stepflow-plugin/src/error.rs @@ -27,6 +27,14 @@ pub enum PluginError { InvalidInput, #[error("error creating plugin")] CreatePlugin, + #[error("generic error: {0}")] + Generic(String), +} + +impl PluginError { + pub fn new(message: impl Into) -> Self { + Self::Generic(message.into()) + } } pub type Result> = std::result::Result; diff --git a/crates/stepflow-plugin/src/lib.rs b/crates/stepflow-plugin/src/lib.rs index f85de956..f9f7fba1 100644 --- a/crates/stepflow-plugin/src/lib.rs +++ b/crates/stepflow-plugin/src/lib.rs @@ -2,6 +2,6 @@ mod context; mod error; mod plugin; -pub use context::{Context, ExecutionContext}; +pub use context::{Context, ExecutionContext, Executor}; pub use error::{PluginError, Result}; pub use plugin::{DynPlugin, Plugin, PluginConfig}; diff --git a/crates/stepflow-protocol/src/blob_handlers.rs b/crates/stepflow-protocol/src/blob_handlers.rs index 61cc2e58..62aa8ae5 100644 --- a/crates/stepflow-protocol/src/blob_handlers.rs +++ b/crates/stepflow-protocol/src/blob_handlers.rs @@ -159,3 +159,60 @@ impl IncomingHandler for GetBlobHandler { .boxed() } } + +/// Handler for streaming_chunk notifications from component servers. 
+pub struct StreamingChunkHandler; + +impl IncomingHandler for StreamingChunkHandler { + fn handle_incoming( + &self, + _method: String, + params: Box, + id: Option, + response_tx: mpsc::Sender, + context: Arc, + ) -> BoxFuture<'static, error_stack::Result<(), StdioError>> { + async move { + // This is a notification (no ID), so we don't send a response + // Instead, we need to handle the streaming chunk + match serde_json::from_str::(params.get()) { + Ok(notification) => { + tracing::info!("Received streaming chunk for request {}: {:?}", + notification.request_id, notification.chunk); + + // Route this chunk to the appropriate workflow executor + if let Some(executor) = context.executor() { + if let Ok(execution_id) = Uuid::parse_str(¬ification.request_id) { + // Try to find the workflow executor for this execution + if let Ok(Some(_boxed_executor)) = executor.get_workflow_executor(execution_id).await { + // For now, just log that we received the chunk + // TODO: Implement proper chunk routing when the streaming pipeline is ready + tracing::info!("Received streaming chunk for execution {}: {:?}", + execution_id, notification.chunk); + } else { + tracing::warn!("No workflow executor found for execution ID: {}", execution_id); + } + } else { + tracing::warn!("Invalid execution ID in streaming chunk: {}", notification.request_id); + } + } else { + tracing::warn!("No executor available in context for streaming chunk routing"); + } + + Ok(()) + } + Err(e) => { + tracing::error!("Failed to parse streaming chunk notification: {}", e); + Ok(()) + } + } + } + .boxed() + } +} + +#[derive(Debug, Deserialize)] +struct StreamingChunkNotification { + request_id: String, + chunk: serde_json::Value, +} diff --git a/crates/stepflow-protocol/src/incoming_handler.rs b/crates/stepflow-protocol/src/incoming_handler.rs index 7efc6019..f61fdddc 100644 --- a/crates/stepflow-protocol/src/incoming_handler.rs +++ b/crates/stepflow-protocol/src/incoming_handler.rs @@ -7,7 +7,7 @@ use tokio::sync::mpsc; use uuid::Uuid; use crate::stdio::StdioError; -use crate::{GetBlobHandler, PutBlobHandler}; +use crate::{GetBlobHandler, PutBlobHandler, StreamingChunkHandler}; /// Trait for handling incoming method calls and notifications from component servers. /// @@ -45,6 +45,7 @@ static INCOMING_HANDLERS: LazyLock = LazyLock::new(|| { let mut registry = IncomingHandlerRegistry::new(); registry.register("put_blob", Box::new(PutBlobHandler)); registry.register("get_blob", Box::new(GetBlobHandler)); + registry.register("streaming_chunk", Box::new(StreamingChunkHandler)); registry }); diff --git a/crates/stepflow-protocol/src/lib.rs b/crates/stepflow-protocol/src/lib.rs index 2043a805..14e3f1de 100644 --- a/crates/stepflow-protocol/src/lib.rs +++ b/crates/stepflow-protocol/src/lib.rs @@ -4,5 +4,5 @@ mod incoming_handler; mod schema; pub mod stdio; -pub use blob_handlers::{GetBlobHandler, PutBlobHandler}; +pub use blob_handlers::{GetBlobHandler, PutBlobHandler, StreamingChunkHandler}; pub use incoming_handler::{IncomingHandler, IncomingHandlerRegistry}; diff --git a/crates/stepflow-server/src/api/debug.rs b/crates/stepflow-server/src/api/debug.rs index 1d62c3c0..915ab5ed 100644 --- a/crates/stepflow-server/src/api/debug.rs +++ b/crates/stepflow-server/src/api/debug.rs @@ -109,6 +109,7 @@ pub async fn debug_continue( let status = match &final_result { FlowResult::Success { .. } => ExecutionStatus::Completed, FlowResult::Failed { .. } | FlowResult::Skipped => ExecutionStatus::Failed, + FlowResult::Streaming { .. 
} => ExecutionStatus::Running, }; state_store diff --git a/crates/stepflow-server/src/api/runs.rs b/crates/stepflow-server/src/api/runs.rs index e5c76702..5c0165d2 100644 --- a/crates/stepflow-server/src/api/runs.rs +++ b/crates/stepflow-server/src/api/runs.rs @@ -212,6 +212,19 @@ pub async fn create_run( debug: debug_mode, })) } + FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { + // For streaming workflows, mark as running + state_store + .update_execution_status(run_id, ExecutionStatus::Running, None) + .await?; + + Ok(Json(CreateRunResponse { + run_id, + result: Some(flow_result), + status: ExecutionStatus::Running, + debug: debug_mode, + })) + } FlowResult::Failed { .. } | FlowResult::Skipped => { // Update execution status to failed state_store diff --git a/examples/audio-streaming-pipeline.yaml b/examples/audio-streaming-pipeline.yaml new file mode 100644 index 00000000..1e333f69 --- /dev/null +++ b/examples/audio-streaming-pipeline.yaml @@ -0,0 +1,82 @@ +name: Audio Streaming Pipeline +description: Real-time audio processing pipeline with microphone input and file output + +input: + operation: + type: string + description: Audio processing operation (amplify, passthrough) + default: "amplify" + sample_rate: + type: integer + description: Audio sample rate in Hz + default: 44100 + channels: + type: integer + description: Number of audio channels + default: 1 + chunk_size: + type: integer + description: Size of audio chunks in samples + default: 1024 + frequency: + type: number + description: Frequency for test sine wave (Hz) + default: 440.0 + source: + type: string + description: Audio source (microphone, system_audio, sine_wave) + default: "microphone" + duration: + type: number + description: Recording duration in seconds + default: 5.0 + output_file: + type: string + description: Output WAV file path + default: "output_audio.wav" + device_name: + type: string + description: Name of audio device to use + default: "C922 Pro Stream Webcam" + +steps: + # Streaming audio source that generates PCM chunks + - id: audio_source + component: python://audio_stream_source + streaming: true + input: + sample_rate: { $from: { workflow: input }, path: sample_rate } + channels: { $from: { workflow: input }, path: channels } + chunk_size: { $from: { workflow: input }, path: chunk_size } + frequency: { $from: { workflow: input }, path: frequency } + source: { $from: { workflow: input }, path: source } + duration: { $from: { workflow: input }, path: duration } + output_file: { $from: { workflow: input }, path: output_file } + device_name: { $from: { workflow: input }, path: device_name } + + # Process the audio chunks + - id: process_chunk + component: python://audio_chunk_processor + streaming: true + input: + chunk: { $from: { step: audio_source }, path: chunk } + chunk_index: { $from: { step: audio_source }, path: chunk_index } + stream_id: { $from: { step: audio_source }, path: stream_id } + sample_rate: { $from: { step: audio_source }, path: sample_rate } + channels: { $from: { step: audio_source }, path: channels } + operation: { $from: { workflow: input }, path: operation } + + # Output the processed chunks + - id: output_chunk + component: python://audio_sink + streaming: true + input: + chunk: { $from: { step: process_chunk }, path: chunk } + chunk_index: { $from: { step: process_chunk }, path: chunk_index } + stream_id: { $from: { step: process_chunk }, path: stream_id } + output_file: { $from: { workflow: input }, path: output_file } + +output: + 
processed_chunks: { $from: { step: output_chunk }, path: result } + source_metadata: { $from: { step: audio_source }, path: sample_rate } + processing_metadata: { $from: { step: process_chunk }, path: sample_rate } \ No newline at end of file diff --git a/examples/audio_input.json b/examples/audio_input.json new file mode 100644 index 00000000..2e0e7023 --- /dev/null +++ b/examples/audio_input.json @@ -0,0 +1,12 @@ +{ + "operation": "amplify", + "sample_rate": 16000, + "channels": 1, + "chunk_size": 1024, + "frequency": 440.0, + "source": "microphone", + "duration": 3.0, + "output_file": "test_workflow_webcam.wav", + "device_name": "C922 Pro Stream Webcam", + "play_audio": true +} diff --git a/examples/stepflow-config.yml b/examples/stepflow-config.yml new file mode 100644 index 00000000..9cb6a04c --- /dev/null +++ b/examples/stepflow-config.yml @@ -0,0 +1,7 @@ +plugins: + - name: builtins + type: builtin + - name: python + type: stdio + command: /home/phact/Desktop/stepflow/sdks/python/.venv/bin/stepflow_sdk + args: [] \ No newline at end of file diff --git a/examples/test_audio_pipeline.sh b/examples/test_audio_pipeline.sh new file mode 100755 index 00000000..ddf37a45 --- /dev/null +++ b/examples/test_audio_pipeline.sh @@ -0,0 +1,94 @@ +#!/bin/bash + +# Audio Pipeline Test Script +# Usage: ./test_audio_pipeline.sh [source] [operation] [duration] [output_file] [device_name] + +SOURCE=${1:-"microphone"} +OPERATION=${2:-"amplify"} +DURATION=${3:-"3.0"} +OUTPUT_FILE=${4:-"test_workflow_webcam.wav"} +DEVICE_NAME=${5:-"C922 Pro Stream Webcam"} + +# Detect if we're running from examples directory or root +SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)" +CURRENT_DIR="$(pwd)" + +if [[ "$CURRENT_DIR" == "$SCRIPT_DIR" ]]; then + # Running from examples directory + INPUT_FILE="audio_input.json" + FLOW_FILE="audio-streaming-pipeline.yaml" + INPUT_DIR="." +else + # Running from root directory + INPUT_FILE="examples/input.json" + FLOW_FILE="examples/audio-streaming-pipeline.yaml" + INPUT_DIR="examples" +fi + +echo "🎵 Testing Audio Streaming Pipeline" +echo "Source: $SOURCE" +echo "Operation: $OPERATION" +echo "Duration: ${DURATION}s" +echo "Output: $OUTPUT_FILE" +echo "Device: $DEVICE_NAME" +echo "Running from: $CURRENT_DIR" +echo "" + +# Create input file +if [[ "$CURRENT_DIR" == "$SCRIPT_DIR" ]]; then + # Running from examples directory + cat > "$INPUT_FILE" << EOF +{ + "operation": "$OPERATION", + "sample_rate": 16000, + "channels": 1, + "chunk_size": 1024, + "frequency": 440.0, + "source": "$SOURCE", + "duration": $DURATION, + "output_file": "$OUTPUT_FILE", + "device_name": "$DEVICE_NAME", + "play_audio": true +} +EOF +else + # Running from root directory + cat > "$INPUT_FILE" << EOF +{ + "operation": "$OPERATION", + "sample_rate": 16000, + "channels": 1, + "chunk_size": 1024, + "frequency": 440.0, + "source": "$SOURCE", + "duration": $DURATION, + "output_file": "$OUTPUT_FILE", + "device_name": "$DEVICE_NAME", + "play_audio": true +} +EOF +fi + +# Run the workflow +cd examples +cargo run --bin stepflow -- run \ + --flow audio-streaming-pipeline.yaml \ + --input input.json +cd .. + +echo "" +echo "✅ Test completed!" 
+echo "📁 Output file: $OUTPUT_FILE" + +# Check if file was created +if [ -f "$OUTPUT_FILE" ]; then + echo "📊 File info:" + file "$OUTPUT_FILE" + echo "📏 File size: $(ls -lh $OUTPUT_FILE | awk '{print $5}')" + echo "🎵 Duration: $(soxi -D $OUTPUT_FILE 2>/dev/null || echo 'Unknown') seconds" +else + echo "❌ Output file not found" +fi + +# Clean up input file +rm -f "$INPUT_FILE" diff --git a/sdks/python/pyproject.toml b/sdks/python/pyproject.toml index 7aaeb343..607bfc54 100644 --- a/sdks/python/pyproject.toml +++ b/sdks/python/pyproject.toml @@ -8,6 +8,9 @@ requires-python = ">=3.13" dependencies = [ "msgspec>=0.19.0", "jsonschema>=4.17.0", + "pyaudio>=0.2.11", + "sounddevice", + "numpy", ] [dependency-groups] diff --git a/sdks/python/src/stepflow_sdk/audio_components.py b/sdks/python/src/stepflow_sdk/audio_components.py new file mode 100644 index 00000000..7517c79f --- /dev/null +++ b/sdks/python/src/stepflow_sdk/audio_components.py @@ -0,0 +1,1016 @@ +""" +Audio streaming components for Stepflow. +Supports PCM 16-bit audio streaming with base64 encoding. +""" + +import base64 +import json +import time +import uuid +from typing import Any, Dict, Optional +from dataclasses import dataclass +import pyaudio +import wave +import os +import threading +import queue +import sys +import numpy as np + +try: + import sounddevice as sd + SOUNDDEVICE_AVAILABLE = True +except ImportError: + SOUNDDEVICE_AVAILABLE = False + + +@dataclass +class AudioChunk: + """Represents a chunk of PCM 16-bit audio data.""" + data: bytes + sample_rate: int + channels: int + chunk_index: int + timestamp: float + + +class StreamingPipeline: + """Coordinates streaming audio processing between components.""" + + def __init__(self): + self.source_queue = queue.Queue() + self.processor_queue = queue.Queue() + self.sink_queue = queue.Queue() + self.running = False + self.threads = [] + + def start_pipeline(self, source_config, processor_config, sink_config): + """Start the streaming pipeline with all components.""" + self.running = True + + # Start source thread + source_thread = threading.Thread( + target=self._run_source, + args=(source_config,), + daemon=True + ) + source_thread.start() + self.threads.append(source_thread) + + # Start processor thread + processor_thread = threading.Thread( + target=self._run_processor, + args=(processor_config,), + daemon=True + ) + processor_thread.start() + self.threads.append(processor_thread) + + # Start sink thread + sink_thread = threading.Thread( + target=self._run_sink, + args=(sink_config,), + daemon=True + ) + sink_thread.start() + self.threads.append(sink_thread) + + print("TIMING: Started streaming pipeline with 3 threads", file=sys.stderr) + + def _run_source(self, config): + """Run the audio source component.""" + try: + # Initialize audio source + source_type = config.get('source', 'microphone') + sample_rate = config.get('sample_rate', 16000) + channels = config.get('channels', 1) + chunk_size = config.get('chunk_size', 1024) + duration = config.get('duration', 5.0) + device_name = config.get('device_name', None) + + # Calculate total chunks + chunk_duration = chunk_size / sample_rate + total_chunks = int(duration / chunk_duration) + + print(f"TIMING: Source starting with {total_chunks} chunks", file=sys.stderr) + + if source_type == 'microphone': + # Set up continuous recording + audio = pyaudio.PyAudio() + + # Find device + device_index = None + if device_name: + for i in range(audio.get_device_count()): + info = audio.get_device_info_by_index(i) + if device_name.lower() in 
info['name'].lower(): + device_index = i + break + + # Auto-detect sample rate + if device_index is not None: + sample_rates = [16000, 22050, 44100, 48000] + for rate in sample_rates: + try: + test_stream = audio.open( + format=pyaudio.paInt16, + channels=channels, + rate=rate, + input=True, + input_device_index=device_index, + frames_per_buffer=chunk_size + ) + test_stream.close() + sample_rate = rate + break + except OSError: + continue + + # Start recording + stream = audio.open( + format=pyaudio.paInt16, + channels=channels, + rate=sample_rate, + input=True, + input_device_index=device_index, + frames_per_buffer=chunk_size + ) + + print(f"TIMING: Started continuous recording at {sample_rate}Hz", file=sys.stderr) + + # Record and emit chunks + for chunk_index in range(total_chunks): + if not self.running: + break + + chunk_start = time.time() + data = stream.read(chunk_size, exception_on_overflow=False) + chunk_time = time.time() + + print(f"TIMING: Source recorded chunk {chunk_index} in {chunk_time - chunk_start:.4f}s", file=sys.stderr) + + # Emit to processor + chunk_data = { + "outcome": "streaming", + "stream_id": str(uuid.uuid4()), + "sample_rate": sample_rate, + "channels": channels, + "chunk_size": len(data), + "format": "pcm_16bit", + "chunk": base64.b64encode(data).decode('utf-8'), + "chunk_index": chunk_index, + "is_final": chunk_index >= total_chunks - 1 + } + + self.source_queue.put(chunk_data) + + stream.stop_stream() + stream.close() + audio.terminate() + + else: + # Generate test data + for chunk_index in range(total_chunks): + if not self.running: + break + + # Generate sine wave + import math + samples = [] + for i in range(chunk_size): + t = (i + chunk_index * chunk_size) / sample_rate + sample = int(32767 * 0.3 * math.sin(2 * math.pi * 440.0 * t)) + samples.append(sample) + + data = b''.join(sample.to_bytes(2, 'little', signed=True) for sample in samples) + + chunk_data = { + "outcome": "streaming", + "stream_id": str(uuid.uuid4()), + "sample_rate": sample_rate, + "channels": channels, + "chunk_size": len(data), + "format": "pcm_16bit", + "chunk": base64.b64encode(data).decode('utf-8'), + "chunk_index": chunk_index, + "is_final": chunk_index >= total_chunks - 1 + } + + self.source_queue.put(chunk_data) + + print("TIMING: Source completed", file=sys.stderr) + + except Exception as e: + print(f"ERROR: Source failed: {e}", file=sys.stderr) + + def _run_processor(self, config): + """Run the audio processor component.""" + try: + operation = config.get('operation', 'passthrough') + print(f"TIMING: Processor starting with operation: {operation}", file=sys.stderr) + + while self.running: + try: + # Get chunk from source (with timeout) + source_chunk = self.source_queue.get(timeout=1.0) + + if source_chunk.get('is_final', False): + # Pass through final chunk + self.processor_queue.put(source_chunk) + break + + chunk_start = time.time() + + # Process the chunk + if operation == 'amplify': + # Decode and amplify + chunk_data = base64.b64decode(source_chunk['chunk']) + samples = [] + for i in range(0, len(chunk_data), 2): + sample = int.from_bytes(chunk_data[i:i+2], 'little', signed=True) + samples.append(sample) + + # Amplify + gain = config.get('gain', 2.0) + amplified_samples = [int(sample * gain) for sample in samples] + amplified_data = b''.join(sample.to_bytes(2, 'little', signed=True) for sample in amplified_samples) + amplified_b64 = base64.b64encode(amplified_data).decode('utf-8') + + processed_chunk = { + **source_chunk, + "chunk": amplified_b64, + "operation": 
"amplify", + "gain": gain + } + else: + # Passthrough + processed_chunk = {**source_chunk, "operation": "passthrough"} + + chunk_time = time.time() + print(f"TIMING: Processor processed chunk {source_chunk['chunk_index']} in {chunk_time - chunk_start:.4f}s", file=sys.stderr) + + # Emit to sink + self.processor_queue.put(processed_chunk) + + except queue.Empty: + continue + + print("TIMING: Processor completed", file=sys.stderr) + + except Exception as e: + print(f"ERROR: Processor failed: {e}", file=sys.stderr) + + def _run_sink(self, config): + """Run the audio sink component.""" + try: + output_file = config.get('output_file', 'output_audio.wav') + all_chunks = [] + + print(f"TIMING: Sink starting, will write to {output_file}", file=sys.stderr) + + while self.running: + try: + # Get chunk from processor (with timeout) + processed_chunk = self.processor_queue.get(timeout=1.0) + + chunk_start = time.time() + + # Decode and store chunk + chunk_data = base64.b64decode(processed_chunk['chunk']) + all_chunks.append(chunk_data) + + chunk_time = time.time() + print(f"TIMING: Sink received chunk {processed_chunk['chunk_index']} in {chunk_time - chunk_start:.4f}s", file=sys.stderr) + + if processed_chunk.get('is_final', False): + break + + except queue.Empty: + continue + + # Write WAV file + if all_chunks: + try: + all_audio_data = b''.join(all_chunks) + sample_rate = processed_chunk.get('sample_rate', 16000) + channels = processed_chunk.get('channels', 1) + + with wave.open(output_file, 'wb') as wav_file: + wav_file.setnchannels(channels) + wav_file.setsampwidth(2) # 16-bit + wav_file.setframerate(sample_rate) + wav_file.writeframes(all_audio_data) + + print(f"TIMING: Sink wrote {len(all_audio_data)} bytes to {output_file}", file=sys.stderr) + + except Exception as e: + print(f"ERROR: Failed to write WAV file: {e}", file=sys.stderr) + + print("TIMING: Sink completed", file=sys.stderr) + + except Exception as e: + print(f"ERROR: Sink failed: {e}", file=sys.stderr) + + def stop_pipeline(self): + """Stop the streaming pipeline.""" + self.running = False + for thread in self.threads: + thread.join(timeout=2.0) + print("TIMING: Pipeline stopped", file=sys.stderr) + + +# Global pipeline instance +_pipeline = None + + +class AudioStreamSource: + """Component that generates PCM 16-bit audio chunks from a source.""" + + def __init__(self, sample_rate: int = 16000, channels: int = 1, chunk_size: int = 1024): + self.sample_rate = sample_rate + self.channels = channels + self.chunk_size = chunk_size + self.stream_id = str(uuid.uuid4()) + self.chunk_index = 0 + self.audio = pyaudio.PyAudio() + self.stream = None + self.is_recording = False + self.audio_queue = queue.Queue() + + def start_microphone_stream(self): + """Start recording from microphone.""" + self.stream = self.audio.open( + format=pyaudio.paInt16, + channels=self.channels, + rate=self.sample_rate, + input=True, + frames_per_buffer=self.chunk_size + ) + self.is_recording = True + + # Start recording thread + threading.Thread(target=self._record_audio, daemon=True).start() + + def _record_audio(self): + """Record audio in background thread.""" + try: + while self.is_recording: + if self.stream: + data = self.stream.read(self.chunk_size, exception_on_overflow=False) + self.audio_queue.put(data) + except Exception as e: + print(f"Recording error: {e}") + + def stop_microphone_stream(self): + """Stop recording from microphone.""" + self.is_recording = False + if self.stream: + self.stream.stop_stream() + self.stream.close() + if self.audio: + 
self.audio.terminate() + + def get_microphone_chunk(self) -> AudioChunk: + """Get a chunk from microphone input.""" + try: + data = self.audio_queue.get(timeout=1.0) # 1 second timeout + chunk = AudioChunk( + data=data, + sample_rate=self.sample_rate, + channels=self.channels, + chunk_index=self.chunk_index, + timestamp=time.time() + ) + self.chunk_index += 1 + return chunk + except queue.Empty: + # Return silence if no audio available + silence_data = b'\x00' * (self.chunk_size * 2) # 16-bit = 2 bytes per sample + chunk = AudioChunk( + data=silence_data, + sample_rate=self.sample_rate, + channels=self.channels, + chunk_index=self.chunk_index, + timestamp=time.time() + ) + self.chunk_index += 1 + return chunk + + def generate_sine_wave_chunk(self, frequency: float = 440.0, duration: float = 0.1) -> AudioChunk: + """Generate a sine wave chunk for testing.""" + import math + + # Generate sine wave samples + samples = [] + for i in range(self.chunk_size): + t = (i + self.chunk_index * self.chunk_size) / self.sample_rate + sample = int(32767 * 0.3 * math.sin(2 * math.pi * frequency * t)) + samples.append(sample) + + # Convert to bytes (16-bit little-endian) + data = b''.join(sample.to_bytes(2, 'little', signed=True) for sample in samples) + + chunk = AudioChunk( + data=data, + sample_rate=self.sample_rate, + channels=self.channels, + chunk_index=self.chunk_index, + timestamp=time.time() + ) + + self.chunk_index += 1 + return chunk + + def start_system_audio_stream(self): + """Start capturing system audio (speaker output).""" + try: + # Try to use PulseAudio loopback device first + self.stream = self.audio.open( + format=pyaudio.paInt16, + channels=self.channels, + rate=self.sample_rate, + input=True, + input_device_index=self._find_system_audio_device(), + frames_per_buffer=self.chunk_size + ) + self.is_recording = True + print(f"Started system audio capture at {self.sample_rate}Hz") + except Exception as e: + print(f"Failed to start system audio capture: {e}") + # Fallback to default input device + self.stream = self.audio.open( + format=pyaudio.paInt16, + channels=self.channels, + rate=self.sample_rate, + input=True, + frames_per_buffer=self.chunk_size + ) + self.is_recording = True + print(f"Fell back to default audio input at {self.sample_rate}Hz") + + def _find_system_audio_device(self): + """Find a suitable system audio capture device.""" + try: + # List available devices + device_count = self.audio.get_device_count() + print(f"Found {device_count} audio devices:") + + for i in range(device_count): + device_info = self.audio.get_device_info_by_index(i) + name = device_info.get('name', 'Unknown') + max_inputs = device_info.get('maxInputChannels', 0) + print(f" Device {i}: {name} (inputs: {max_inputs})") + + # Look for loopback, monitor, or system audio devices + if (max_inputs > 0 and + any(keyword in name.lower() for keyword in + ['loopback', 'monitor', 'system', 'speaker', 'output'])): + print(f" Selected system audio device: {name}") + return i + + # If no specific system audio device found, try default + print("No specific system audio device found, using default") + return None + + except Exception as e: + print(f"Error finding system audio device: {e}") + return None + + def get_system_audio_chunk(self): + """Get a chunk of system audio data.""" + if not self.is_recording or not self.stream: + raise RuntimeError("System audio stream not started") + + try: + # Read audio data + data = self.stream.read(self.chunk_size, exception_on_overflow=False) + + # Create audio chunk + chunk = 
AudioChunk( + data=data, + sample_rate=self.sample_rate, + channels=self.channels, + chunk_index=self.chunk_index, + timestamp=time.time() + ) + + self.chunk_index += 1 + return chunk + + except Exception as e: + print(f"Error reading system audio: {e}") + # Return silence on error + silence_data = b'\x00' * (self.chunk_size * 2) + chunk = AudioChunk( + data=silence_data, + sample_rate=self.sample_rate, + channels=self.channels, + chunk_index=self.chunk_index, + timestamp=time.time() + ) + self.chunk_index += 1 + return chunk + + +def audio_stream_source(data: Dict[str, Any], context=None): + """ + Component that generates audio stream chunks using continuous background recording. + + Input: + source: str - audio source type ("sine_wave", "microphone", "system_audio") + duration: float - duration in seconds + sample_rate: int - sample rate in Hz (will auto-detect if not supported) + channels: int - number of audio channels + chunk_size: int - size of each chunk in samples + frequency: float - frequency for sine wave (if source is sine_wave) + output_file: str - path to output WAV file + device_name: str - name of audio device to use (e.g., "C922 Pro Stream Webcam") + + Output: + Streaming audio chunks with metadata + """ + global _pipeline + + # Check if we should use the streaming pipeline + use_pipeline = data.get('use_pipeline', False) + + if use_pipeline and _pipeline is None: + # Start the streaming pipeline + _pipeline = StreamingPipeline() + + # Extract configs for each component + source_config = { + 'source': data.get('source', 'microphone'), + 'sample_rate': data.get('sample_rate', 16000), + 'channels': data.get('channels', 1), + 'chunk_size': data.get('chunk_size', 1024), + 'duration': data.get('duration', 5.0), + 'device_name': data.get('device_name', None), + 'frequency': data.get('frequency', 440.0) + } + + processor_config = { + 'operation': data.get('operation', 'passthrough'), + 'gain': data.get('gain', 2.0) + } + + sink_config = { + 'output_file': data.get('output_file', 'output_audio.wav') + } + + # Start the pipeline + _pipeline.start_pipeline(source_config, processor_config, sink_config) + + # Return a simple success response since the pipeline is running + return { + "outcome": "success", + "result": { + "message": "Streaming pipeline started", + "pipeline_id": str(uuid.uuid4()) + } + } + + # Fallback to the original implementation for non-pipeline mode + import time + start_time = time.time() + + source_type = data.get('source', 'sine_wave') + duration = data.get('duration', 5.0) + requested_sample_rate = data.get('sample_rate', 44100) + channels = data.get('channels', 1) + chunk_size = data.get('chunk_size', 1024) + frequency = data.get('frequency', 440.0) + output_file = data.get('output_file', 'output_audio.wav') + device_name = data.get('device_name', None) + + print(f"TIMING: Starting audio_stream_source at {start_time}", file=sys.stderr) + + # Initialize PyAudio + audio = pyaudio.PyAudio() + + # Find device if specified + device_index = None + if device_name: + for i in range(audio.get_device_count()): + info = audio.get_device_info_by_index(i) + if device_name.lower() in info['name'].lower(): + device_index = i + print(f"Found device: {info['name']} (index {i})", file=sys.stderr) + break + + # Auto-detect sample rate if device is specified + sample_rate = requested_sample_rate + if device_index is not None: + sample_rates = [16000, 22050, 44100, 48000] + for rate in sample_rates: + try: + test_stream = audio.open(format=pyaudio.paInt16, + channels=channels, + 
rate=rate, + input=True, + input_device_index=device_index, + frames_per_buffer=chunk_size) + test_stream.close() + sample_rate = rate + print(f"Using sample rate: {sample_rate} Hz for device", file=sys.stderr) + break + except OSError: + continue + + # Calculate how many chunks we need for the full duration + chunk_duration = chunk_size / sample_rate # seconds per chunk + total_chunks = int(duration / chunk_duration) + + print(f"DEBUG: Generating {total_chunks} chunks for {duration}s audio at {sample_rate}Hz", file=sys.stderr) + print(f"DEBUG: chunk_duration={chunk_duration}s, chunk_size={chunk_size} samples", file=sys.stderr) + + # Collect all chunks for direct WAV file writing + all_chunks = [] + + if source_type == 'microphone': + # Set up continuous recording with queue + audio_queue = queue.Queue() + recording_stop = threading.Event() + + def record_audio_continuously(): + """Background thread that continuously records audio.""" + try: + if device_index is not None: + stream = audio.open( + format=pyaudio.paInt16, + channels=channels, + rate=sample_rate, + input=True, + input_device_index=device_index, + frames_per_buffer=chunk_size + ) + else: + stream = audio.open( + format=pyaudio.paInt16, + channels=channels, + rate=sample_rate, + input=True, + frames_per_buffer=chunk_size + ) + + print(f"Started continuous recording from device {device_index}", file=sys.stderr) + + chunk_index = 0 + while not recording_stop.is_set() and chunk_index < total_chunks: + try: + data = stream.read(chunk_size, exception_on_overflow=False) + audio_queue.put((chunk_index, data)) + chunk_index += 1 + except Exception as e: + print(f"Recording error: {e}", file=sys.stderr) + break + + stream.stop_stream() + stream.close() + print(f"Recording thread completed after {chunk_index} chunks", file=sys.stderr) + + except Exception as e: + print(f"Failed to start recording: {e}", file=sys.stderr) + + # Start recording thread + recording_thread = threading.Thread(target=record_audio_continuously, daemon=True) + recording_thread.start() + + print(f"DEBUG: Started continuous recording thread", file=sys.stderr) + + # Stream chunks as they become available + for chunk_index in range(total_chunks): + chunk_start_time = time.time() + print(f"TIMING: Waiting for chunk {chunk_index}/{total_chunks-1} at {chunk_start_time}", file=sys.stderr) + + try: + # Wait for chunk from recording thread (with timeout) + received_index, chunk_data = audio_queue.get(timeout=5.0) # 5 second timeout + + if received_index != chunk_index: + print(f"WARNING: Expected chunk {chunk_index} but got {received_index}", file=sys.stderr) + + audio_capture_time = time.time() + print(f"TIMING: Got chunk {chunk_index} from queue in {audio_capture_time - chunk_start_time:.4f}s", file=sys.stderr) + + except queue.Empty: + print(f"ERROR: Timeout waiting for chunk {chunk_index}", file=sys.stderr) + # Generate silence as fallback + chunk_data = b'\x00' * (chunk_size * 2) # 16-bit = 2 bytes per sample + + # Store chunk for WAV file writing + all_chunks.append(chunk_data) + + chunk_b64 = base64.b64encode(chunk_data).decode('utf-8') + is_final = chunk_index >= total_chunks - 1 + + encoding_time = time.time() + print(f"TIMING: Base64 encoding took {encoding_time - audio_capture_time:.4f}s", file=sys.stderr) + + print(f"DEBUG: Yielding chunk {chunk_index}/{total_chunks-1}, is_final={is_final}", file=sys.stderr) + + yield { + "outcome": "streaming", + "stream_id": str(uuid.uuid4()), + "sample_rate": sample_rate, + "channels": channels, + "chunk_size": 
len(chunk_data), + "format": "pcm_16bit", + "chunk": chunk_b64, + "chunk_index": chunk_index, + "is_final": is_final + } + + chunk_end_time = time.time() + print(f"TIMING: Total chunk {chunk_index} processing took {chunk_end_time - chunk_start_time:.4f}s", file=sys.stderr) + + # Stop recording + recording_stop.set() + recording_thread.join(timeout=2.0) + + elif source_type == 'system_audio': + # Similar implementation for system audio + try: + source = AudioStreamSource(sample_rate, channels, chunk_size) + source.start_system_audio_stream() + + for chunk_index in range(total_chunks): + chunk_start_time = time.time() + chunk = source.get_system_audio_chunk() + + audio_capture_time = time.time() + print(f"TIMING: System audio capture took {audio_capture_time - chunk_start_time:.4f}s", file=sys.stderr) + + all_chunks.append(chunk.data) + chunk_b64 = base64.b64encode(chunk.data).decode('utf-8') + is_final = chunk_index >= total_chunks - 1 + + yield { + "outcome": "streaming", + "stream_id": chunk.stream_id, + "sample_rate": chunk.sample_rate, + "channels": chunk.channels, + "chunk_size": len(chunk.data), + "format": "pcm_16bit", + "chunk": chunk_b64, + "chunk_index": chunk_index, + "is_final": is_final + } + except Exception as e: + print(f"System audio capture failed: {e}. Falling back to sine wave.", file=sys.stderr) + source_type = 'sine_wave' + + if source_type == 'sine_wave': + # Generate sine wave chunks (no queue needed) + source = AudioStreamSource(sample_rate, channels, chunk_size) + + for chunk_index in range(total_chunks): + chunk_start_time = time.time() + chunk = source.generate_sine_wave_chunk(frequency, chunk_duration) + + audio_capture_time = time.time() + print(f"TIMING: Sine wave generation took {audio_capture_time - chunk_start_time:.4f}s", file=sys.stderr) + + all_chunks.append(chunk.data) + chunk_b64 = base64.b64encode(chunk.data).decode('utf-8') + is_final = chunk_index >= total_chunks - 1 + + yield { + "outcome": "streaming", + "stream_id": chunk.stream_id, + "sample_rate": chunk.sample_rate, + "channels": chunk.channels, + "chunk_size": len(chunk.data), + "format": "pcm_16bit", + "chunk": chunk_b64, + "chunk_index": chunk_index, + "is_final": is_final + } + + print(f"DEBUG: Generator loop completed. Processed {len(all_chunks)} chunks.", file=sys.stderr) + + # Write WAV file directly when streaming completes + if all_chunks: + try: + print(f"DEBUG: Writing WAV file directly: {output_file}", file=sys.stderr) + all_audio_data = b''.join(all_chunks) + + with wave.open(output_file, 'wb') as wav_file: + wav_file.setnchannels(channels) + wav_file.setsampwidth(2) # 16-bit + wav_file.setframerate(sample_rate) + wav_file.writeframes(all_audio_data) + + print(f"DEBUG: WAV file written successfully: {output_file} ({len(all_audio_data)} bytes)", file=sys.stderr) + except Exception as e: + print(f"ERROR: Failed to write WAV file {output_file}: {e}", file=sys.stderr) + else: + print(f"DEBUG: No chunks collected, skipping WAV file write", file=sys.stderr) + + total_time = time.time() - start_time + print(f"TIMING: Total audio_stream_source execution took {total_time:.4f}s", file=sys.stderr) + + +def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: + """ + Component that processes PCM 16-bit audio chunks. 
+ + Input: + chunk: str - base64 encoded PCM data + chunk_index: int + sample_rate: int + channels: int + operation: str - processing operation ("amplify", "filter", "analyze") + + Output: + Processed chunk or analysis results + """ + import time + start_time = time.time() + + chunk_b64 = data['chunk'] + chunk_index = data.get('chunk_index', 0) + sample_rate = data.get('sample_rate', 16000) + channels = data.get('channels', 1) + operation = data.get('operation', 'analyze') + + print(f"TIMING: audio_chunk_processor starting chunk {chunk_index} at {start_time}", file=sys.stderr) + + # Decode base64 chunk + chunk_data = base64.b64decode(chunk_b64) + decode_time = time.time() + print(f"TIMING: Base64 decode took {decode_time - start_time:.4f}s", file=sys.stderr) + + # Convert bytes to samples + samples = [] + for i in range(0, len(chunk_data), 2): + sample = int.from_bytes(chunk_data[i:i+2], 'little', signed=True) + samples.append(sample) + + convert_time = time.time() + print(f"TIMING: Sample conversion took {convert_time - decode_time:.4f}s", file=sys.stderr) + + if operation == "amplify": + # Amplify the audio (multiply by gain factor) + gain = data.get('gain', 2.0) + amplified_samples = [int(sample * gain) for sample in samples] + + # Convert back to bytes + amplified_data = b''.join(sample.to_bytes(2, 'little', signed=True) for sample in amplified_samples) + amplified_b64 = base64.b64encode(amplified_data).decode('utf-8') + + process_time = time.time() + print(f"TIMING: Amplification processing took {process_time - convert_time:.4f}s", file=sys.stderr) + + result = { + "outcome": "streaming", + "stream_id": data.get('stream_id', f"processed_{chunk_index}"), + "sample_rate": sample_rate, + "channels": channels, + "operation": "amplify", + "gain": gain, + "chunk": amplified_b64, + "chunk_index": chunk_index, + "is_final": data.get('is_final', False) + } + + elif operation == "analyze": + # Analyze the audio chunk + if samples: + max_amplitude = max(abs(sample) for sample in samples) + avg_amplitude = sum(abs(sample) for sample in samples) / len(samples) + rms = (sum(sample * sample for sample in samples) / len(samples)) ** 0.5 + else: + max_amplitude = avg_amplitude = rms = 0 + + process_time = time.time() + print(f"TIMING: Analysis processing took {process_time - convert_time:.4f}s", file=sys.stderr) + + result = { + "outcome": "success", + "result": { + "chunk_index": chunk_index, + "sample_count": len(samples), + "max_amplitude": max_amplitude, + "avg_amplitude": avg_amplitude, + "rms": rms, + "sample_rate": sample_rate, + "channels": channels + } + } + + else: + # Pass through unchanged + result = { + "outcome": "streaming", + "stream_id": data.get('stream_id', f"passthrough_{chunk_index}"), + "sample_rate": sample_rate, + "channels": channels, + "operation": "passthrough", + "chunk": chunk_b64, + "chunk_index": chunk_index, + "is_final": data.get('is_final', False) + } + + total_time = time.time() - start_time + print(f"TIMING: audio_chunk_processor total time for chunk {chunk_index}: {total_time:.4f}s", file=sys.stderr) + + return result + + +def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: + """ + Component that receives and processes audio chunks (sink). 
+ + Input: + chunk: str - base64 encoded PCM data + chunk_index: int + stream_id: str + output_file: str (optional) - path to output WAV file + play_audio: bool (optional) - whether to play audio in real time + + Output: + Confirmation of chunk received and file written + """ + import time + start_time = time.time() + + chunk_b64 = data.get('chunk', '') + chunk_index = data.get('chunk_index', 0) + stream_id = data.get('stream_id', 'unknown') + output_file = data.get('output_file', 'output_audio.wav') + play_audio = data.get('play_audio', False) + + print(f"TIMING: audio_sink starting chunk {chunk_index} at {start_time}", file=sys.stderr) + + # Decode the chunk + if chunk_b64: + chunk_data = base64.b64decode(chunk_b64) + decode_time = time.time() + print(f"TIMING: Base64 decode took {decode_time - start_time:.4f}s", file=sys.stderr) + + # Convert to samples for analysis + samples = [] + for i in range(0, len(chunk_data), 2): + sample = int.from_bytes(chunk_data[i:i+2], 'little', signed=True) + samples.append(sample) + + # Calculate audio levels + if samples: + max_amplitude = max(abs(sample) for sample in samples) + avg_amplitude = sum(abs(sample) for sample in samples) / len(samples) + rms = (sum(sample * sample for sample in samples) / len(samples)) ** 0.5 + else: + max_amplitude = avg_amplitude = rms = 0 + + analysis_time = time.time() + print(f"TIMING: Audio analysis took {analysis_time - decode_time:.4f}s", file=sys.stderr) + + # Play audio if requested + if play_audio: + try: + import sounddevice as sd + import numpy as np + + # Convert to numpy array + audio_array = np.array(samples, dtype=np.int16) + + # Play the audio + sd.play(audio_array, samplerate=data.get('sample_rate', 16000)) + sd.wait() + + play_time = time.time() + print(f"TIMING: Audio playback took {play_time - analysis_time:.4f}s", file=sys.stderr) + + except ImportError: + print("WARNING: sounddevice not available, skipping audio playback", file=sys.stderr) + except Exception as e: + print(f"ERROR: Audio playback failed: {e}", file=sys.stderr) + + result = { + "outcome": "success", + "result": { + "chunk_index": chunk_index, + "stream_id": stream_id, + "max_amplitude": max_amplitude, + "avg_amplitude": avg_amplitude, + "rms": rms, + "sample_count": len(samples), + "chunk_size_bytes": len(chunk_data), + "output_file": output_file + } + } + else: + result = { + "outcome": "success", + "result": { + "chunk_index": chunk_index, + "stream_id": stream_id, + "message": "No audio data received" + } + } + + total_time = time.time() - start_time + print(f"TIMING: audio_sink total time for chunk {chunk_index}: {total_time:.4f}s", file=sys.stderr) + + return result \ No newline at end of file diff --git a/sdks/python/src/stepflow_sdk/main.py b/sdks/python/src/stepflow_sdk/main.py index 3950ee68..99010e13 100644 --- a/sdks/python/src/stepflow_sdk/main.py +++ b/sdks/python/src/stepflow_sdk/main.py @@ -4,6 +4,7 @@ from typing import Any, List from stepflow_sdk.server import StepflowStdioServer from stepflow_sdk.context import StepflowContext +from stepflow_sdk.audio_components import audio_stream_source, audio_chunk_processor, audio_sink # Create server instance server = StepflowStdioServer() @@ -508,6 +509,11 @@ async def wrapper(data): except Exception as e: raise ValueError(f"Code compilation failed: {e}") +# Register audio components +server.component(name="audio_stream_source")(audio_stream_source) +server.component(name="audio_chunk_processor")(audio_chunk_processor) +server.component(name="audio_sink")(audio_sink) + def 
main(): # Start the server server.run() diff --git a/sdks/python/src/stepflow_sdk/server.py b/sdks/python/src/stepflow_sdk/server.py index 0105d8c6..b49b7d59 100644 --- a/sdks/python/src/stepflow_sdk/server.py +++ b/sdks/python/src/stepflow_sdk/server.py @@ -67,6 +67,9 @@ def decorator(f: Callable) -> Callable: # Extract description from parameter or docstring component_description = description or (f.__doc__.strip() if f.__doc__ else None) + # Check if this is a generator function + is_generator = inspect.isgeneratorfunction(f) + self._components[component_name] = ComponentEntry( name=component_name, function=f, @@ -75,8 +78,9 @@ def decorator(f: Callable) -> Callable: description=component_description ) - # Store whether function expects context + # Store whether function expects context and is a generator f._expects_context = expects_context + f._is_generator = is_generator @wraps(f) def wrapper(*args, **kwargs): @@ -130,8 +134,10 @@ async def _handle_method_request(self, request: Message) -> Message | None: ) case "component_execute": execute_request = msgspec.json.decode(request.params, type=ComponentExecuteRequest) + print(f"DEBUG: Executing component: {execute_request.component}", file=sys.stderr) component = self.get_component(execute_request.component) if not component: + print(f"DEBUG: Component {execute_request.component} not found!", file=sys.stderr) return Message( id=id, error={ @@ -140,29 +146,57 @@ async def _handle_method_request(self, request: Message) -> Message | None: "data": None } ) + print(f"DEBUG: Component found, executing function", file=sys.stderr) try: # Parse input parameters into the expected type input = msgspec.json.decode(execute_request.input, type=component.input_type) + print(f"DEBUG: Input parsed successfully: {input}", file=sys.stderr) - # Execute component with or without context - import asyncio - import inspect + # Execute the component function + output = component.function(input) + print(f"DEBUG: Component function executed, output type: {type(output)}", file=sys.stderr) - if hasattr(component.function, '_expects_context') and component.function._expects_context: - if inspect.iscoroutinefunction(component.function): - output = await component.function(input, self._context) + # Check if this is a generator function + if hasattr(component.function, '_is_generator') and component.function._is_generator: + # For generators, we need to yield each result as streaming + if inspect.isgenerator(output): + results = [] + for result in output: + results.append(result) + # Send streaming notification + await self._outgoing_queue.put({ + "jsonrpc": "2.0", + "method": "streaming_chunk", + "params": { + "request_id": str(id), + "chunk": result + } + }) + + # Return the final result (last chunk) + if results: + return Message( + id=id, + result=ComponentExecuteResponse(output=results[-1]), + ) + else: + # Empty generator + return Message( + id=id, + result=ComponentExecuteResponse(output={"outcome": "success", "result": None}), + ) else: - output = component.function(input, self._context) + # Not actually a generator, treat as normal + return Message( + id=id, + result=ComponentExecuteResponse(output=output), + ) else: - if inspect.iscoroutinefunction(component.function): - output = await component.function(input) - else: - output = component.function(input) - - return Message( - id=id, - result=ComponentExecuteResponse(output=output), - ) + # Normal non-generator function + return Message( + id=id, + result=ComponentExecuteResponse(output=output), + ) except 
Exception as e: return Message( id=id, diff --git a/sdks/python/uv.lock b/sdks/python/uv.lock index 9c368820..34640d06 100644 --- a/sdks/python/uv.lock +++ b/sdks/python/uv.lock @@ -10,6 +10,28 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/77/06/bb80f5f86020c4551da315d78b3ab75e8228f89f0162f2c3a819e407941a/attrs-25.3.0-py3-none-any.whl", hash = "sha256:427318ce031701fea540783410126f03899a97ffc6f61596ad581ac2e40e3bc3", size = 63815 }, ] +[[package]] +name = "cffi" +version = "1.17.1" +source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "pycparser" }, +] +sdist = { url = "https://files.pythonhosted.org/packages/fc/97/c783634659c2920c3fc70419e3af40972dbaf758daa229a7d6ea6135c90d/cffi-1.17.1.tar.gz", hash = "sha256:1c39c6016c32bc48dd54561950ebd6836e1670f2ae46128f67cf49e789c52824", size = 516621 } +wheels = [ + { url = "https://files.pythonhosted.org/packages/8d/f8/dd6c246b148639254dad4d6803eb6a54e8c85c6e11ec9df2cffa87571dbe/cffi-1.17.1-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:f3a2b4222ce6b60e2e8b337bb9596923045681d71e5a082783484d845390938e", size = 182989 }, + { url = "https://files.pythonhosted.org/packages/8b/f1/672d303ddf17c24fc83afd712316fda78dc6fce1cd53011b839483e1ecc8/cffi-1.17.1-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:0984a4925a435b1da406122d4d7968dd861c1385afe3b45ba82b750f229811e2", size = 178802 }, + { url = "https://files.pythonhosted.org/packages/0e/2d/eab2e858a91fdff70533cab61dcff4a1f55ec60425832ddfdc9cd36bc8af/cffi-1.17.1-cp313-cp313-manylinux_2_12_i686.manylinux2010_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:d01b12eeeb4427d3110de311e1774046ad344f5b1a7403101878976ecd7a10f3", size = 454792 }, + { url = "https://files.pythonhosted.org/packages/75/b2/fbaec7c4455c604e29388d55599b99ebcc250a60050610fadde58932b7ee/cffi-1.17.1-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:706510fe141c86a69c8ddc029c7910003a17353970cff3b904ff0686a5927683", size = 478893 }, + { url = "https://files.pythonhosted.org/packages/4f/b7/6e4a2162178bf1935c336d4da8a9352cccab4d3a5d7914065490f08c0690/cffi-1.17.1-cp313-cp313-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:de55b766c7aa2e2a3092c51e0483d700341182f08e67c63630d5b6f200bb28e5", size = 485810 }, + { url = "https://files.pythonhosted.org/packages/c7/8a/1d0e4a9c26e54746dc08c2c6c037889124d4f59dffd853a659fa545f1b40/cffi-1.17.1-cp313-cp313-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:c59d6e989d07460165cc5ad3c61f9fd8f1b4796eacbd81cee78957842b834af4", size = 471200 }, + { url = "https://files.pythonhosted.org/packages/26/9f/1aab65a6c0db35f43c4d1b4f580e8df53914310afc10ae0397d29d697af4/cffi-1.17.1-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:dd398dbc6773384a17fe0d3e7eeb8d1a21c2200473ee6806bb5e6a8e62bb73dd", size = 479447 }, + { url = "https://files.pythonhosted.org/packages/5f/e4/fb8b3dd8dc0e98edf1135ff067ae070bb32ef9d509d6cb0f538cd6f7483f/cffi-1.17.1-cp313-cp313-musllinux_1_1_aarch64.whl", hash = "sha256:3edc8d958eb099c634dace3c7e16560ae474aa3803a5df240542b305d14e14ed", size = 484358 }, + { url = "https://files.pythonhosted.org/packages/f1/47/d7145bf2dc04684935d57d67dff9d6d795b2ba2796806bb109864be3a151/cffi-1.17.1-cp313-cp313-musllinux_1_1_x86_64.whl", hash = "sha256:72e72408cad3d5419375fc87d289076ee319835bdfa2caad331e377589aebba9", size = 488469 }, + { url = 
"https://files.pythonhosted.org/packages/bf/ee/f94057fa6426481d663b88637a9a10e859e492c73d0384514a17d78ee205/cffi-1.17.1-cp313-cp313-win32.whl", hash = "sha256:e03eab0a8677fa80d646b5ddece1cbeaf556c313dcfac435ba11f107ba117b5d", size = 172475 }, + { url = "https://files.pythonhosted.org/packages/7c/fc/6a8cb64e5f0324877d503c854da15d76c1e50eb722e320b15345c4d0c6de/cffi-1.17.1-cp313-cp313-win_amd64.whl", hash = "sha256:f6a16c31041f09ead72d69f583767292f750d24913dadacf5756b966aacb3f1a", size = 182009 }, +] + [[package]] name = "colorama" version = "0.4.6" @@ -99,6 +121,36 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/23/d8/f15b40611c2d5753d1abb0ca0da0c75348daf1252220e5dda2867bd81062/msgspec-0.19.0-cp313-cp313-win_amd64.whl", hash = "sha256:317050bc0f7739cb30d257ff09152ca309bf5a369854bbf1e57dffc310c1f20f", size = 187432 }, ] +[[package]] +name = "numpy" +version = "2.3.1" +source = { registry = "https://pypi.org/simple" } +sdist = { url = "https://files.pythonhosted.org/packages/2e/19/d7c972dfe90a353dbd3efbbe1d14a5951de80c99c9dc1b93cd998d51dc0f/numpy-2.3.1.tar.gz", hash = "sha256:1ec9ae20a4226da374362cca3c62cd753faf2f951440b0e3b98e93c235441d2b", size = 20390372 } +wheels = [ + { url = "https://files.pythonhosted.org/packages/d4/bd/35ad97006d8abff8631293f8ea6adf07b0108ce6fec68da3c3fcca1197f2/numpy-2.3.1-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:25a1992b0a3fdcdaec9f552ef10d8103186f5397ab45e2d25f8ac51b1a6b97e8", size = 20889381 }, + { url = "https://files.pythonhosted.org/packages/f1/4f/df5923874d8095b6062495b39729178eef4a922119cee32a12ee1bd4664c/numpy-2.3.1-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:7dea630156d39b02a63c18f508f85010230409db5b2927ba59c8ba4ab3e8272e", size = 14152726 }, + { url = "https://files.pythonhosted.org/packages/8c/0f/a1f269b125806212a876f7efb049b06c6f8772cf0121139f97774cd95626/numpy-2.3.1-cp313-cp313-macosx_14_0_arm64.whl", hash = "sha256:bada6058dd886061f10ea15f230ccf7dfff40572e99fef440a4a857c8728c9c0", size = 5105145 }, + { url = "https://files.pythonhosted.org/packages/6d/63/a7f7fd5f375b0361682f6ffbf686787e82b7bbd561268e4f30afad2bb3c0/numpy-2.3.1-cp313-cp313-macosx_14_0_x86_64.whl", hash = "sha256:a894f3816eb17b29e4783e5873f92faf55b710c2519e5c351767c51f79d8526d", size = 6639409 }, + { url = "https://files.pythonhosted.org/packages/bf/0d/1854a4121af895aab383f4aa233748f1df4671ef331d898e32426756a8a6/numpy-2.3.1-cp313-cp313-manylinux_2_28_aarch64.whl", hash = "sha256:18703df6c4a4fee55fd3d6e5a253d01c5d33a295409b03fda0c86b3ca2ff41a1", size = 14257630 }, + { url = "https://files.pythonhosted.org/packages/50/30/af1b277b443f2fb08acf1c55ce9d68ee540043f158630d62cef012750f9f/numpy-2.3.1-cp313-cp313-manylinux_2_28_x86_64.whl", hash = "sha256:5902660491bd7a48b2ec16c23ccb9124b8abfd9583c5fdfa123fe6b421e03de1", size = 16627546 }, + { url = "https://files.pythonhosted.org/packages/6e/ec/3b68220c277e463095342d254c61be8144c31208db18d3fd8ef02712bcd6/numpy-2.3.1-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:36890eb9e9d2081137bd78d29050ba63b8dab95dff7912eadf1185e80074b2a0", size = 15562538 }, + { url = "https://files.pythonhosted.org/packages/77/2b/4014f2bcc4404484021c74d4c5ee8eb3de7e3f7ac75f06672f8dcf85140a/numpy-2.3.1-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:a780033466159c2270531e2b8ac063704592a0bc62ec4a1b991c7c40705eb0e8", size = 18360327 }, + { url = "https://files.pythonhosted.org/packages/40/8d/2ddd6c9b30fcf920837b8672f6c65590c7d92e43084c25fc65edc22e93ca/numpy-2.3.1-cp313-cp313-win32.whl", hash = 
"sha256:39bff12c076812595c3a306f22bfe49919c5513aa1e0e70fac756a0be7c2a2b8", size = 6312330 }, + { url = "https://files.pythonhosted.org/packages/dd/c8/beaba449925988d415efccb45bf977ff8327a02f655090627318f6398c7b/numpy-2.3.1-cp313-cp313-win_amd64.whl", hash = "sha256:8d5ee6eec45f08ce507a6570e06f2f879b374a552087a4179ea7838edbcbfa42", size = 12731565 }, + { url = "https://files.pythonhosted.org/packages/0b/c3/5c0c575d7ec78c1126998071f58facfc124006635da75b090805e642c62e/numpy-2.3.1-cp313-cp313-win_arm64.whl", hash = "sha256:0c4d9e0a8368db90f93bd192bfa771ace63137c3488d198ee21dfb8e7771916e", size = 10190262 }, + { url = "https://files.pythonhosted.org/packages/ea/19/a029cd335cf72f79d2644dcfc22d90f09caa86265cbbde3b5702ccef6890/numpy-2.3.1-cp313-cp313t-macosx_10_13_x86_64.whl", hash = "sha256:b0b5397374f32ec0649dd98c652a1798192042e715df918c20672c62fb52d4b8", size = 20987593 }, + { url = "https://files.pythonhosted.org/packages/25/91/8ea8894406209107d9ce19b66314194675d31761fe2cb3c84fe2eeae2f37/numpy-2.3.1-cp313-cp313t-macosx_11_0_arm64.whl", hash = "sha256:c5bdf2015ccfcee8253fb8be695516ac4457c743473a43290fd36eba6a1777eb", size = 14300523 }, + { url = "https://files.pythonhosted.org/packages/a6/7f/06187b0066eefc9e7ce77d5f2ddb4e314a55220ad62dd0bfc9f2c44bac14/numpy-2.3.1-cp313-cp313t-macosx_14_0_arm64.whl", hash = "sha256:d70f20df7f08b90a2062c1f07737dd340adccf2068d0f1b9b3d56e2038979fee", size = 5227993 }, + { url = "https://files.pythonhosted.org/packages/e8/ec/a926c293c605fa75e9cfb09f1e4840098ed46d2edaa6e2152ee35dc01ed3/numpy-2.3.1-cp313-cp313t-macosx_14_0_x86_64.whl", hash = "sha256:2fb86b7e58f9ac50e1e9dd1290154107e47d1eef23a0ae9145ded06ea606f992", size = 6736652 }, + { url = "https://files.pythonhosted.org/packages/e3/62/d68e52fb6fde5586650d4c0ce0b05ff3a48ad4df4ffd1b8866479d1d671d/numpy-2.3.1-cp313-cp313t-manylinux_2_28_aarch64.whl", hash = "sha256:23ab05b2d241f76cb883ce8b9a93a680752fbfcbd51c50eff0b88b979e471d8c", size = 14331561 }, + { url = "https://files.pythonhosted.org/packages/fc/ec/b74d3f2430960044bdad6900d9f5edc2dc0fb8bf5a0be0f65287bf2cbe27/numpy-2.3.1-cp313-cp313t-manylinux_2_28_x86_64.whl", hash = "sha256:ce2ce9e5de4703a673e705183f64fd5da5bf36e7beddcb63a25ee2286e71ca48", size = 16693349 }, + { url = "https://files.pythonhosted.org/packages/0d/15/def96774b9d7eb198ddadfcbd20281b20ebb510580419197e225f5c55c3e/numpy-2.3.1-cp313-cp313t-musllinux_1_2_aarch64.whl", hash = "sha256:c4913079974eeb5c16ccfd2b1f09354b8fed7e0d6f2cab933104a09a6419b1ee", size = 15642053 }, + { url = "https://files.pythonhosted.org/packages/2b/57/c3203974762a759540c6ae71d0ea2341c1fa41d84e4971a8e76d7141678a/numpy-2.3.1-cp313-cp313t-musllinux_1_2_x86_64.whl", hash = "sha256:010ce9b4f00d5c036053ca684c77441f2f2c934fd23bee058b4d6f196efd8280", size = 18434184 }, + { url = "https://files.pythonhosted.org/packages/22/8a/ccdf201457ed8ac6245187850aff4ca56a79edbea4829f4e9f14d46fa9a5/numpy-2.3.1-cp313-cp313t-win32.whl", hash = "sha256:6269b9edfe32912584ec496d91b00b6d34282ca1d07eb10e82dfc780907d6c2e", size = 6440678 }, + { url = "https://files.pythonhosted.org/packages/f1/7e/7f431d8bd8eb7e03d79294aed238b1b0b174b3148570d03a8a8a8f6a0da9/numpy-2.3.1-cp313-cp313t-win_amd64.whl", hash = "sha256:2a809637460e88a113e186e87f228d74ae2852a2e0c44de275263376f17b5bdc", size = 12870697 }, + { url = "https://files.pythonhosted.org/packages/d4/ca/af82bf0fad4c3e573c6930ed743b5308492ff19917c7caaf2f9b6f9e2e98/numpy-2.3.1-cp313-cp313t-win_arm64.whl", hash = "sha256:eccb9a159db9aed60800187bc47a6d3451553f0e1b08b068d8b277ddfbb9b244", size = 10260376 }, +] + 
[[package]] name = "packaging" version = "25.0" @@ -117,6 +169,25 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/88/5f/e351af9a41f866ac3f1fac4ca0613908d9a41741cfcf2228f4ad853b697d/pluggy-1.5.0-py3-none-any.whl", hash = "sha256:44e1ad92c8ca002de6377e165f3e0f1be63266ab4d554740532335b9d75ea669", size = 20556 }, ] +[[package]] +name = "pyaudio" +version = "0.2.14" +source = { registry = "https://pypi.org/simple" } +sdist = { url = "https://files.pythonhosted.org/packages/26/1d/8878c7752febb0f6716a7e1a52cb92ac98871c5aa522cba181878091607c/PyAudio-0.2.14.tar.gz", hash = "sha256:78dfff3879b4994d1f4fc6485646a57755c6ee3c19647a491f790a0895bd2f87", size = 47066 } +wheels = [ + { url = "https://files.pythonhosted.org/packages/3a/77/66cd37111a87c1589b63524f3d3c848011d21ca97828422c7fde7665ff0d/PyAudio-0.2.14-cp313-cp313-win32.whl", hash = "sha256:95328285b4dab57ea8c52a4a996cb52be6d629353315be5bfda403d15932a497", size = 150982 }, + { url = "https://files.pythonhosted.org/packages/a5/8b/7f9a061c1cc2b230f9ac02a6003fcd14c85ce1828013aecbaf45aa988d20/PyAudio-0.2.14-cp313-cp313-win_amd64.whl", hash = "sha256:692d8c1446f52ed2662120bcd9ddcb5aa2b71f38bda31e58b19fb4672fffba69", size = 173655 }, +] + +[[package]] +name = "pycparser" +version = "2.22" +source = { registry = "https://pypi.org/simple" } +sdist = { url = "https://files.pythonhosted.org/packages/1d/b2/31537cf4b1ca988837256c910a668b553fceb8f069bedc4b1c826024b52c/pycparser-2.22.tar.gz", hash = "sha256:491c8be9c040f5390f5bf44a5b07752bd07f56edf992381b05c701439eec10f6", size = 172736 } +wheels = [ + { url = "https://files.pythonhosted.org/packages/13/a3/a812df4e2dd5696d1f351d58b8fe16a405b234ad2886a0dab9183fb78109/pycparser-2.22-py3-none-any.whl", hash = "sha256:c3702b6d3dd8c7abc1afa565d7e63d53a1d0bd86cdc24edd75470f4de499cfcc", size = 117552 }, +] + [[package]] name = "pytest" version = "8.3.5" @@ -205,6 +276,21 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/b6/97/5a4b59697111c89477d20ba8a44df9ca16b41e737fa569d5ae8bff99e650/rpds_py-0.25.1-cp313-cp313t-win_amd64.whl", hash = "sha256:401ca1c4a20cc0510d3435d89c069fe0a9ae2ee6495135ac46bdd49ec0495763", size = 232218 }, ] +[[package]] +name = "sounddevice" +version = "0.5.2" +source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "cffi" }, +] +sdist = { url = "https://files.pythonhosted.org/packages/91/a6/91e9f08ed37c7c9f56b5227c6aea7f2ae63ba2d59520eefb24e82cbdd589/sounddevice-0.5.2.tar.gz", hash = "sha256:c634d51bd4e922d6f0fa5e1a975cc897c947f61d31da9f79ba7ea34dff448b49", size = 53150 } +wheels = [ + { url = "https://files.pythonhosted.org/packages/75/2d/582738fc01352a5bc20acac9221e58538365cecb3bb264838f66419df219/sounddevice-0.5.2-py3-none-any.whl", hash = "sha256:82375859fac2e73295a4ab3fc60bd4782743157adc339561c1f1142af472f505", size = 32450 }, + { url = "https://files.pythonhosted.org/packages/3f/6f/e3dd751face4fcb5be25e8abba22f25d8e6457ebd7e9ed79068b768dc0e5/sounddevice-0.5.2-py3-none-macosx_10_6_x86_64.macosx_10_6_universal2.whl", hash = "sha256:943f27e66037d41435bdd0293454072cdf657b594c9cde63cd01ee3daaac7ab3", size = 108088 }, + { url = "https://files.pythonhosted.org/packages/45/0b/bfad79af0b380aa7c0bfe73e4b03e0af45354a48ad62549489bd7696c5b0/sounddevice-0.5.2-py3-none-win32.whl", hash = "sha256:3a113ce614a2c557f14737cb20123ae6298c91fc9301eb014ada0cba6d248c5f", size = 312665 }, + { url = "https://files.pythonhosted.org/packages/e1/3e/61d88e6b0a7383127cdc779195cb9d83ebcf11d39bc961de5777e457075e/sounddevice-0.5.2-py3-none-win_amd64.whl", hash = 
"sha256:e18944b767d2dac3771a7771bdd7ff7d3acd7d334e72c4bedab17d1aed5dbc22", size = 363808 }, +] + [[package]] name = "stepflow-sdk" version = "0.1.0" @@ -212,6 +298,9 @@ source = { editable = "." } dependencies = [ { name = "jsonschema" }, { name = "msgspec" }, + { name = "numpy" }, + { name = "pyaudio" }, + { name = "sounddevice" }, ] [package.dev-dependencies] @@ -225,6 +314,9 @@ dev = [ requires-dist = [ { name = "jsonschema", specifier = ">=4.17.0" }, { name = "msgspec", specifier = ">=0.19.0" }, + { name = "numpy" }, + { name = "pyaudio", specifier = ">=0.2.11" }, + { name = "sounddevice" }, ] [package.metadata.requires-dev] From 477cbe85b5f7f84458a579f49c735827481275ff Mon Sep 17 00:00:00 2001 From: phact Date: Tue, 24 Jun 2025 11:19:16 -0400 Subject: [PATCH 02/14] rust coordination --- .../src/workflow_executor.rs | 180 ++++++++++++++++-- crates/stepflow-protocol/src/blob_handlers.rs | 3 +- .../src/sqlite_state_store.rs | 42 +++- crates/stepflow-state/src/in_memory.rs | 48 +++-- crates/stepflow-state/src/state_store.rs | 14 ++ examples/audio_input.json | 7 +- examples/test_audio_pipeline.sh | 44 +---- .../src/stepflow_sdk/audio_components.py | 4 +- 8 files changed, 260 insertions(+), 82 deletions(-) diff --git a/crates/stepflow-execution/src/workflow_executor.rs b/crates/stepflow-execution/src/workflow_executor.rs index 18633665..b3eb1ea2 100644 --- a/crates/stepflow-execution/src/workflow_executor.rs +++ b/crates/stepflow-execution/src/workflow_executor.rs @@ -83,6 +83,29 @@ impl WorkflowExecutor { // Create execution context let context = executor.execution_context(execution_id); + // Initialize streaming coordinator if workflow has streaming steps + let streaming_coordinator = if flow.steps.iter().any(|step| step.streaming) { + let pipeline_steps: Vec = flow.steps.iter() + .enumerate() + .filter(|(_, step)| step.streaming) + .map(|(index, _)| index) + .collect(); + + if !pipeline_steps.is_empty() { + let coordinator = StreamingPipelineCoordinator::new( + executor.clone(), + flow.clone(), + pipeline_steps, + context.clone(), + ); + Some(std::sync::Arc::new(tokio::sync::Mutex::new(coordinator))) + } else { + None + } + } else { + None + }; + Ok(Self { tracker, resolver, @@ -90,7 +113,7 @@ impl WorkflowExecutor { executor, flow, context, - streaming_coordinator: None, + streaming_coordinator, }) } @@ -725,6 +748,7 @@ impl WorkflowExecutor { // Create a streaming coordinator and store it let coordinator = std::sync::Arc::new(tokio::sync::Mutex::new(StreamingPipelineCoordinator::new( self.executor.clone(), + self.flow.clone(), pipeline_steps, self.context.clone(), ))); @@ -853,18 +877,70 @@ impl WorkflowExecutor { pub async fn route_streaming_chunk(&mut self, chunk: serde_json::Value) -> Result<()> { tracing::debug!("Routing streaming chunk to workflow executor"); - // For now, we'll just log the chunk - // In a full implementation, this would route the chunk to the appropriate streaming step - tracing::info!("Received streaming chunk: {:?}", chunk); + // Parse the chunk to extract request_id and chunk data + let chunk_data = match serde_json::from_value::>(chunk.clone()) { + Ok(data) => data, + Err(e) => { + tracing::error!("Failed to parse streaming chunk: {}", e); + return Ok(()); + } + }; + + // Extract request_id and chunk content + let request_id = chunk_data.get("request_id") + .and_then(|v| v.as_str()) + .unwrap_or("unknown"); + + let chunk_content = chunk_data.get("chunk") + .cloned() + .unwrap_or(serde_json::Value::Null); + + tracing::debug!("Routing chunk for request {}: 
{:?}", request_id, chunk_content); + + // Find streaming steps that are currently active + let streaming_steps = self.find_active_streaming_steps().await?; - // TODO: Implement proper chunk routing to streaming steps - // This would involve: - // 1. Finding which streaming step should receive this chunk - // 2. Sending it through the appropriate channel - // 3. Triggering the step to process the chunk + if streaming_steps.is_empty() { + tracing::warn!("No active streaming steps found for chunk routing"); + return Ok(()); + } + + // Route the chunk to the first streaming step (source step) + // In a more sophisticated implementation, we'd route based on stream_id + if let Some(first_step_index) = streaming_steps.first() { + if let Some(coordinator) = &self.streaming_coordinator { + let mut coordinator = coordinator.lock().await; + coordinator.route_chunk_to_step(*first_step_index, chunk_content).await?; + tracing::debug!("Routed chunk to streaming step {}", first_step_index); + } + } Ok(()) } + + /// Find currently active streaming steps + async fn find_active_streaming_steps(&self) -> Result> { + let mut active_steps = Vec::new(); + + for (step_index, step) in self.flow.steps.iter().enumerate() { + if step.streaming { + // Check if this step is currently running or ready to run + let step_status = self.state_store + .get_step_status(self.execution_id(), step_index) + .await + .map_err(|e| error_stack::report!(ExecutionError::StateError).attach_printable(format!("State error: {e}")))?; + match step_status { + stepflow_core::status::StepStatus::Running | + stepflow_core::status::StepStatus::Runnable => { + active_steps.push(step_index); + } + _ => {} + } + } + } + + Ok(active_steps) + } } /// Execute a single step asynchronously. @@ -963,6 +1039,7 @@ pub struct StepInspection { /// Coordinates streaming execution between multiple steps in a pipeline struct StreamingPipelineCoordinator { executor: Arc, + flow: Arc, pipeline_steps: Vec, context: ExecutionContext, step_connections: std::collections::HashMap>, @@ -972,6 +1049,7 @@ struct StreamingPipelineCoordinator { impl StreamingPipelineCoordinator { fn new( executor: Arc, + flow: Arc, pipeline_steps: Vec, context: ExecutionContext, ) -> Self { @@ -987,6 +1065,7 @@ impl StreamingPipelineCoordinator { Self { executor, + flow, pipeline_steps, context, step_connections, @@ -995,25 +1074,67 @@ impl StreamingPipelineCoordinator { } async fn execute_pipeline(&mut self) -> Result<()> { - // For now, we'll just log that we're executing a streaming pipeline - // In a full implementation, this would coordinate all the streaming steps tracing::info!("Executing streaming pipeline with {} steps", self.pipeline_steps.len()); - // TODO: Implement full streaming pipeline coordination - // This would involve: - // 1. Starting all streaming steps in parallel - // 2. Setting up channels between steps - // 3. Routing chunks between steps - // 4. 
Handling backpressure and flow control + // Create tasks for each streaming step + let mut tasks = Vec::new(); + let flow_arc = self.flow.clone(); + + for &step_index in &self.pipeline_steps { + let flow_arc = flow_arc.clone(); + let step_input = self.resolve_step_input(step_index).await?; + let downstream_senders = self.get_downstream_senders(step_index); + + if let Some(receiver) = self.step_receivers.remove(&step_index) { + let executor = self.executor.clone(); + let context = self.context.clone(); + let task = tokio::spawn(async move { + let step = &flow_arc.steps[step_index]; + Self::run_streaming_step( + executor, + step, + step_input, + context, + receiver, + downstream_senders, + ).await + }); + tasks.push(task); + } + } + + // Wait for all streaming steps to complete + for task in tasks { + task.await.map_err(|_e| ExecutionError::StepFailed { + step: "streaming_pipeline".to_string() + })??; + } Ok(()) } + + async fn resolve_step_input(&self, step_index: usize) -> Result { + // Create a basic input for streaming steps + // In a full implementation, this would resolve dependencies from previous steps + let step = &self.flow.steps[step_index]; + + // For streaming steps, we typically need some basic configuration + let input = serde_json::json!({ + "step_id": step.id, + "step_index": step_index, + "streaming": true, + "component": step.component.to_string() + }); + + Ok(stepflow_core::workflow::ValueRef::new(input)) + } fn get_downstream_senders(&self, step_index: usize) -> Vec> { let mut senders = Vec::new(); + // Find steps that come after this step in the pipeline for &other_step_index in &self.pipeline_steps { - if other_step_index != step_index { + if other_step_index > step_index { if let Some(sender) = self.step_connections.get(&other_step_index) { senders.push(sender.clone()); } @@ -1022,6 +1143,29 @@ impl StreamingPipelineCoordinator { senders } + + async fn route_chunk_to_step(&mut self, step_index: usize, chunk: serde_json::Value) -> Result<()> { + if let Some(sender) = self.step_connections.get(&step_index) { + let flow_result = FlowResult::Streaming { + stream_id: "routed_chunk".to_string(), + metadata: stepflow_core::workflow::ValueRef::new(serde_json::json!({})), + chunk: chunk.to_string(), + chunk_index: 0, + is_final: false, + }; + + sender.send(flow_result).await + .map_err(|e| ExecutionError::StepFailed { + step: format!("step_{}", step_index) + })?; + + tracing::debug!("Successfully routed chunk to step {}", step_index); + } else { + tracing::warn!("No sender found for step {}", step_index); + } + + Ok(()) + } async fn run_streaming_step( executor: Arc, diff --git a/crates/stepflow-protocol/src/blob_handlers.rs b/crates/stepflow-protocol/src/blob_handlers.rs index 62aa8ae5..96ed90f6 100644 --- a/crates/stepflow-protocol/src/blob_handlers.rs +++ b/crates/stepflow-protocol/src/blob_handlers.rs @@ -184,11 +184,12 @@ impl IncomingHandler for StreamingChunkHandler { if let Some(executor) = context.executor() { if let Ok(execution_id) = Uuid::parse_str(¬ification.request_id) { // Try to find the workflow executor for this execution - if let Ok(Some(_boxed_executor)) = executor.get_workflow_executor(execution_id).await { + if let Ok(Some(mut workflow_executor)) = executor.get_workflow_executor(execution_id).await { // For now, just log that we received the chunk // TODO: Implement proper chunk routing when the streaming pipeline is ready tracing::info!("Received streaming chunk for execution {}: {:?}", execution_id, notification.chunk); + tracing::warn!("Streaming chunk 
routing not yet implemented for trait objects"); } else { tracing::warn!("No workflow executor found for execution ID: {}", execution_id); } diff --git a/crates/stepflow-state-sql/src/sqlite_state_store.rs b/crates/stepflow-state-sql/src/sqlite_state_store.rs index 0ae09434..28b5c2a5 100644 --- a/crates/stepflow-state-sql/src/sqlite_state_store.rs +++ b/crates/stepflow-state-sql/src/sqlite_state_store.rs @@ -1005,7 +1005,45 @@ impl StateStore for SqliteStateStore { } Ok(runnable_steps) - } - .boxed() + }.boxed() + } + + fn get_step_status( + &self, + execution_id: Uuid, + step_index: usize, + ) -> BoxFuture<'_, error_stack::Result> { + let pool = self.pool.clone(); + + async move { + let sql = "SELECT status FROM step_info WHERE execution_id = ? AND step_index = ?"; + + let row = sqlx::query(sql) + .bind(execution_id.to_string()) + .bind(step_index as i64) + .fetch_optional(&pool) + .await + .change_context(StateError::Internal)?; + + let row = row.ok_or_else(|| { + error_stack::report!(StateError::StepResultNotFoundByIndex { + execution_id: execution_id.to_string(), + step_idx: step_index, + }) + })?; + + let status_str: String = row.get("status"); + let status = match status_str.as_str() { + "blocked" => stepflow_core::status::StepStatus::Blocked, + "runnable" => stepflow_core::status::StepStatus::Runnable, + "running" => stepflow_core::status::StepStatus::Running, + "completed" => stepflow_core::status::StepStatus::Completed, + "failed" => stepflow_core::status::StepStatus::Failed, + "skipped" => stepflow_core::status::StepStatus::Skipped, + _ => stepflow_core::status::StepStatus::Blocked, // Default fallback + }; + + Ok(status) + }.boxed() } } diff --git a/crates/stepflow-state/src/in_memory.rs b/crates/stepflow-state/src/in_memory.rs index 5503c00a..90e663e7 100644 --- a/crates/stepflow-state/src/in_memory.rs +++ b/crates/stepflow-state/src/in_memory.rs @@ -688,30 +688,46 @@ impl StateStore for InMemoryStateStore { &self, execution_id: uuid::Uuid, ) -> BoxFuture<'_, error_stack::Result, crate::StateError>> { - let step_info_map = self.step_info.clone(); + let step_info = self.step_info.clone(); async move { - let step_info_guard = step_info_map.read().await; + let step_info = step_info.read().await; + let execution_steps = step_info.get(&execution_id).ok_or_else(|| { + error_stack::report!(crate::StateError::ExecutionNotFound { execution_id }) + })?; - // Get all step info for this execution - let execution_steps = step_info_guard - .get(&execution_id) + let runnable_steps: Vec = execution_steps + .values() + .filter(|step| matches!(step.status, stepflow_core::status::StepStatus::Runnable)) .cloned() - .unwrap_or_default(); + .collect(); + + Ok(runnable_steps) + } + .boxed() + } - // Find steps that are marked as runnable - let mut runnable_steps = Vec::new(); + fn get_step_status( + &self, + execution_id: uuid::Uuid, + step_index: usize, + ) -> BoxFuture<'_, error_stack::Result> { + let step_info = self.step_info.clone(); - for step_info in execution_steps.values() { - if step_info.status == stepflow_core::status::StepStatus::Runnable { - runnable_steps.push(step_info.clone()); - } - } + async move { + let step_info = step_info.read().await; + let execution_steps = step_info.get(&execution_id).ok_or_else(|| { + error_stack::report!(crate::StateError::ExecutionNotFound { execution_id }) + })?; - // Sort by step_index for consistent ordering - runnable_steps.sort_by_key(|step| step.step_index); + let step = execution_steps.get(&step_index).ok_or_else(|| { + 
error_stack::report!(crate::StateError::StepResultNotFoundByIndex { + execution_id: execution_id.to_string(), + step_idx: step_index, + }) + })?; - Ok(runnable_steps) + Ok(step.status) } .boxed() } diff --git a/crates/stepflow-state/src/state_store.rs b/crates/stepflow-state/src/state_store.rs index fd2d6174..bd3e0850 100644 --- a/crates/stepflow-state/src/state_store.rs +++ b/crates/stepflow-state/src/state_store.rs @@ -305,6 +305,20 @@ pub trait StateStore: Send + Sync { &self, execution_id: Uuid, ) -> BoxFuture<'_, error_stack::Result, StateError>>; + + /// Get the status of a specific step. + /// + /// # Arguments + /// * `execution_id` - The unique identifier for the workflow execution + /// * `step_index` - The index of the step within the workflow (0-based) + /// + /// # Returns + /// The step status if found, or an error if not found + fn get_step_status( + &self, + execution_id: Uuid, + step_index: usize, + ) -> BoxFuture<'_, error_stack::Result>; } /// The step result. diff --git a/examples/audio_input.json b/examples/audio_input.json index 2e0e7023..25a274dd 100644 --- a/examples/audio_input.json +++ b/examples/audio_input.json @@ -1,12 +1,11 @@ { + "source": "microphone", "operation": "amplify", - "sample_rate": 16000, + "sample_rate": 44100, "channels": 1, "chunk_size": 1024, "frequency": 440.0, - "source": "microphone", "duration": 3.0, "output_file": "test_workflow_webcam.wav", - "device_name": "C922 Pro Stream Webcam", - "play_audio": true + "device_name": "C922 Pro Stream Webcam" } diff --git a/examples/test_audio_pipeline.sh b/examples/test_audio_pipeline.sh index ddf37a45..c173bbd2 100755 --- a/examples/test_audio_pipeline.sh +++ b/examples/test_audio_pipeline.sh @@ -20,7 +20,7 @@ if [[ "$CURRENT_DIR" == "$SCRIPT_DIR" ]]; then INPUT_DIR="." else # Running from root directory - INPUT_FILE="examples/input.json" + INPUT_FILE="examples/audio_input.json" FLOW_FILE="examples/audio-streaming-pipeline.yaml" INPUT_DIR="examples" fi @@ -34,48 +34,15 @@ echo "Device: $DEVICE_NAME" echo "Running from: $CURRENT_DIR" echo "" -# Create input file +# Run the workflow if [[ "$CURRENT_DIR" == "$SCRIPT_DIR" ]]; then - # Running from examples directory - cat > "$INPUT_FILE" << EOF -{ - "operation": "$OPERATION", - "sample_rate": 16000, - "channels": 1, - "chunk_size": 1024, - "frequency": 440.0, - "source": "$SOURCE", - "duration": $DURATION, - "output_file": "$OUTPUT_FILE", - "device_name": "$DEVICE_NAME", - "play_audio": true -} -EOF + # Running from examples directory - run from current directory + cargo run -- run --flow audio-streaming-pipeline.yaml --input audio_input.json else # Running from root directory - cat > "$INPUT_FILE" << EOF -{ - "operation": "$OPERATION", - "sample_rate": 16000, - "channels": 1, - "chunk_size": 1024, - "frequency": 440.0, - "source": "$SOURCE", - "duration": $DURATION, - "output_file": "$OUTPUT_FILE", - "device_name": "$DEVICE_NAME", - "play_audio": true -} -EOF + cargo run -- run --flow examples/audio-streaming-pipeline.yaml --input examples/audio_input.json fi -# Run the workflow -cd examples -cargo run --bin stepflow -- run \ - --flow audio-streaming-pipeline.yaml \ - --input input.json -cd .. - echo "" echo "✅ Test completed!" 
echo "📁 Output file: $OUTPUT_FILE" @@ -91,4 +58,3 @@ else fi # Clean up input file -rm -f "$INPUT_FILE" diff --git a/sdks/python/src/stepflow_sdk/audio_components.py b/sdks/python/src/stepflow_sdk/audio_components.py index 7517c79f..1668e392 100644 --- a/sdks/python/src/stepflow_sdk/audio_components.py +++ b/sdks/python/src/stepflow_sdk/audio_components.py @@ -671,7 +671,7 @@ def record_audio_continuously(): except Exception as e: print(f"Failed to start recording: {e}", file=sys.stderr) - + # Start recording thread recording_thread = threading.Thread(target=record_audio_continuously, daemon=True) recording_thread.start() @@ -723,7 +723,7 @@ def record_audio_continuously(): chunk_end_time = time.time() print(f"TIMING: Total chunk {chunk_index} processing took {chunk_end_time - chunk_start_time:.4f}s", file=sys.stderr) - + # Stop recording recording_stop.set() recording_thread.join(timeout=2.0) From 6ba8e4ba972b3e42a8aa405c43a373076d7adb69 Mon Sep 17 00:00:00 2001 From: phact Date: Tue, 24 Jun 2025 11:28:18 -0400 Subject: [PATCH 03/14] remove python streaming pipeline --- .../src/stepflow_sdk/audio_components.py | 547 +++--------------- 1 file changed, 71 insertions(+), 476 deletions(-) diff --git a/sdks/python/src/stepflow_sdk/audio_components.py b/sdks/python/src/stepflow_sdk/audio_components.py index 1668e392..0a921e9b 100644 --- a/sdks/python/src/stepflow_sdk/audio_components.py +++ b/sdks/python/src/stepflow_sdk/audio_components.py @@ -34,311 +34,18 @@ class AudioChunk: timestamp: float -class StreamingPipeline: - """Coordinates streaming audio processing between components.""" - - def __init__(self): - self.source_queue = queue.Queue() - self.processor_queue = queue.Queue() - self.sink_queue = queue.Queue() - self.running = False - self.threads = [] - - def start_pipeline(self, source_config, processor_config, sink_config): - """Start the streaming pipeline with all components.""" - self.running = True - - # Start source thread - source_thread = threading.Thread( - target=self._run_source, - args=(source_config,), - daemon=True - ) - source_thread.start() - self.threads.append(source_thread) - - # Start processor thread - processor_thread = threading.Thread( - target=self._run_processor, - args=(processor_config,), - daemon=True - ) - processor_thread.start() - self.threads.append(processor_thread) - - # Start sink thread - sink_thread = threading.Thread( - target=self._run_sink, - args=(sink_config,), - daemon=True - ) - sink_thread.start() - self.threads.append(sink_thread) - - print("TIMING: Started streaming pipeline with 3 threads", file=sys.stderr) - - def _run_source(self, config): - """Run the audio source component.""" - try: - # Initialize audio source - source_type = config.get('source', 'microphone') - sample_rate = config.get('sample_rate', 16000) - channels = config.get('channels', 1) - chunk_size = config.get('chunk_size', 1024) - duration = config.get('duration', 5.0) - device_name = config.get('device_name', None) - - # Calculate total chunks - chunk_duration = chunk_size / sample_rate - total_chunks = int(duration / chunk_duration) - - print(f"TIMING: Source starting with {total_chunks} chunks", file=sys.stderr) - - if source_type == 'microphone': - # Set up continuous recording - audio = pyaudio.PyAudio() - - # Find device - device_index = None - if device_name: - for i in range(audio.get_device_count()): - info = audio.get_device_info_by_index(i) - if device_name.lower() in info['name'].lower(): - device_index = i - break - - # Auto-detect sample rate - if 
device_index is not None: - sample_rates = [16000, 22050, 44100, 48000] - for rate in sample_rates: - try: - test_stream = audio.open( - format=pyaudio.paInt16, - channels=channels, - rate=rate, - input=True, - input_device_index=device_index, - frames_per_buffer=chunk_size - ) - test_stream.close() - sample_rate = rate - break - except OSError: - continue - - # Start recording - stream = audio.open( - format=pyaudio.paInt16, - channels=channels, - rate=sample_rate, - input=True, - input_device_index=device_index, - frames_per_buffer=chunk_size - ) - - print(f"TIMING: Started continuous recording at {sample_rate}Hz", file=sys.stderr) - - # Record and emit chunks - for chunk_index in range(total_chunks): - if not self.running: - break - - chunk_start = time.time() - data = stream.read(chunk_size, exception_on_overflow=False) - chunk_time = time.time() - - print(f"TIMING: Source recorded chunk {chunk_index} in {chunk_time - chunk_start:.4f}s", file=sys.stderr) - - # Emit to processor - chunk_data = { - "outcome": "streaming", - "stream_id": str(uuid.uuid4()), - "sample_rate": sample_rate, - "channels": channels, - "chunk_size": len(data), - "format": "pcm_16bit", - "chunk": base64.b64encode(data).decode('utf-8'), - "chunk_index": chunk_index, - "is_final": chunk_index >= total_chunks - 1 - } - - self.source_queue.put(chunk_data) - - stream.stop_stream() - stream.close() - audio.terminate() - - else: - # Generate test data - for chunk_index in range(total_chunks): - if not self.running: - break - - # Generate sine wave - import math - samples = [] - for i in range(chunk_size): - t = (i + chunk_index * chunk_size) / sample_rate - sample = int(32767 * 0.3 * math.sin(2 * math.pi * 440.0 * t)) - samples.append(sample) - - data = b''.join(sample.to_bytes(2, 'little', signed=True) for sample in samples) - - chunk_data = { - "outcome": "streaming", - "stream_id": str(uuid.uuid4()), - "sample_rate": sample_rate, - "channels": channels, - "chunk_size": len(data), - "format": "pcm_16bit", - "chunk": base64.b64encode(data).decode('utf-8'), - "chunk_index": chunk_index, - "is_final": chunk_index >= total_chunks - 1 - } - - self.source_queue.put(chunk_data) - - print("TIMING: Source completed", file=sys.stderr) - - except Exception as e: - print(f"ERROR: Source failed: {e}", file=sys.stderr) - - def _run_processor(self, config): - """Run the audio processor component.""" - try: - operation = config.get('operation', 'passthrough') - print(f"TIMING: Processor starting with operation: {operation}", file=sys.stderr) - - while self.running: - try: - # Get chunk from source (with timeout) - source_chunk = self.source_queue.get(timeout=1.0) - - if source_chunk.get('is_final', False): - # Pass through final chunk - self.processor_queue.put(source_chunk) - break - - chunk_start = time.time() - - # Process the chunk - if operation == 'amplify': - # Decode and amplify - chunk_data = base64.b64decode(source_chunk['chunk']) - samples = [] - for i in range(0, len(chunk_data), 2): - sample = int.from_bytes(chunk_data[i:i+2], 'little', signed=True) - samples.append(sample) - - # Amplify - gain = config.get('gain', 2.0) - amplified_samples = [int(sample * gain) for sample in samples] - amplified_data = b''.join(sample.to_bytes(2, 'little', signed=True) for sample in amplified_samples) - amplified_b64 = base64.b64encode(amplified_data).decode('utf-8') - - processed_chunk = { - **source_chunk, - "chunk": amplified_b64, - "operation": "amplify", - "gain": gain - } - else: - # Passthrough - processed_chunk = {**source_chunk, 
"operation": "passthrough"} - - chunk_time = time.time() - print(f"TIMING: Processor processed chunk {source_chunk['chunk_index']} in {chunk_time - chunk_start:.4f}s", file=sys.stderr) - - # Emit to sink - self.processor_queue.put(processed_chunk) - - except queue.Empty: - continue - - print("TIMING: Processor completed", file=sys.stderr) - - except Exception as e: - print(f"ERROR: Processor failed: {e}", file=sys.stderr) - - def _run_sink(self, config): - """Run the audio sink component.""" - try: - output_file = config.get('output_file', 'output_audio.wav') - all_chunks = [] - - print(f"TIMING: Sink starting, will write to {output_file}", file=sys.stderr) - - while self.running: - try: - # Get chunk from processor (with timeout) - processed_chunk = self.processor_queue.get(timeout=1.0) - - chunk_start = time.time() - - # Decode and store chunk - chunk_data = base64.b64decode(processed_chunk['chunk']) - all_chunks.append(chunk_data) - - chunk_time = time.time() - print(f"TIMING: Sink received chunk {processed_chunk['chunk_index']} in {chunk_time - chunk_start:.4f}s", file=sys.stderr) - - if processed_chunk.get('is_final', False): - break - - except queue.Empty: - continue - - # Write WAV file - if all_chunks: - try: - all_audio_data = b''.join(all_chunks) - sample_rate = processed_chunk.get('sample_rate', 16000) - channels = processed_chunk.get('channels', 1) - - with wave.open(output_file, 'wb') as wav_file: - wav_file.setnchannels(channels) - wav_file.setsampwidth(2) # 16-bit - wav_file.setframerate(sample_rate) - wav_file.writeframes(all_audio_data) - - print(f"TIMING: Sink wrote {len(all_audio_data)} bytes to {output_file}", file=sys.stderr) - - except Exception as e: - print(f"ERROR: Failed to write WAV file: {e}", file=sys.stderr) - - print("TIMING: Sink completed", file=sys.stderr) - - except Exception as e: - print(f"ERROR: Sink failed: {e}", file=sys.stderr) - - def stop_pipeline(self): - """Stop the streaming pipeline.""" - self.running = False - for thread in self.threads: - thread.join(timeout=2.0) - print("TIMING: Pipeline stopped", file=sys.stderr) - - -# Global pipeline instance -_pipeline = None - - class AudioStreamSource: - """Component that generates PCM 16-bit audio chunks from a source.""" + """Individual audio source component for generating audio chunks.""" def __init__(self, sample_rate: int = 16000, channels: int = 1, chunk_size: int = 1024): self.sample_rate = sample_rate self.channels = channels self.chunk_size = chunk_size self.stream_id = str(uuid.uuid4()) - self.chunk_index = 0 - self.audio = pyaudio.PyAudio() - self.stream = None - self.is_recording = False - self.audio_queue = queue.Queue() - + def start_microphone_stream(self): - """Start recording from microphone.""" + """Initialize microphone stream.""" + self.audio = pyaudio.PyAudio() self.stream = self.audio.open( format=pyaudio.paInt16, channels=self.channels, @@ -346,175 +53,105 @@ def start_microphone_stream(self): input=True, frames_per_buffer=self.chunk_size ) - self.is_recording = True - - # Start recording thread - threading.Thread(target=self._record_audio, daemon=True).start() - + def _record_audio(self): - """Record audio in background thread.""" - try: - while self.is_recording: - if self.stream: - data = self.stream.read(self.chunk_size, exception_on_overflow=False) - self.audio_queue.put(data) - except Exception as e: - print(f"Recording error: {e}") - + """Record a single chunk of audio.""" + return self.stream.read(self.chunk_size, exception_on_overflow=False) + def 
stop_microphone_stream(self): - """Stop recording from microphone.""" - self.is_recording = False - if self.stream: + """Stop and clean up microphone stream.""" + if hasattr(self, 'stream'): self.stream.stop_stream() self.stream.close() - if self.audio: + if hasattr(self, 'audio'): self.audio.terminate() - + def get_microphone_chunk(self) -> AudioChunk: - """Get a chunk from microphone input.""" - try: - data = self.audio_queue.get(timeout=1.0) # 1 second timeout - chunk = AudioChunk( - data=data, - sample_rate=self.sample_rate, - channels=self.channels, - chunk_index=self.chunk_index, - timestamp=time.time() - ) - self.chunk_index += 1 - return chunk - except queue.Empty: - # Return silence if no audio available - silence_data = b'\x00' * (self.chunk_size * 2) # 16-bit = 2 bytes per sample - chunk = AudioChunk( - data=silence_data, - sample_rate=self.sample_rate, - channels=self.channels, - chunk_index=self.chunk_index, - timestamp=time.time() - ) - self.chunk_index += 1 - return chunk - + """Get a single chunk of audio from microphone.""" + data = self._record_audio() + return AudioChunk( + data=data, + sample_rate=self.sample_rate, + channels=self.channels, + chunk_index=0, + timestamp=time.time() + ) + def generate_sine_wave_chunk(self, frequency: float = 440.0, duration: float = 0.1) -> AudioChunk: """Generate a sine wave chunk for testing.""" import math - # Generate sine wave samples samples = [] for i in range(self.chunk_size): - t = (i + self.chunk_index * self.chunk_size) / self.sample_rate + t = i / self.sample_rate sample = int(32767 * 0.3 * math.sin(2 * math.pi * frequency * t)) samples.append(sample) - # Convert to bytes (16-bit little-endian) data = b''.join(sample.to_bytes(2, 'little', signed=True) for sample in samples) - chunk = AudioChunk( + return AudioChunk( data=data, sample_rate=self.sample_rate, channels=self.channels, - chunk_index=self.chunk_index, + chunk_index=0, timestamp=time.time() ) - - self.chunk_index += 1 - return chunk - + def start_system_audio_stream(self): - """Start capturing system audio (speaker output).""" - try: - # Try to use PulseAudio loopback device first - self.stream = self.audio.open( - format=pyaudio.paInt16, - channels=self.channels, - rate=self.sample_rate, - input=True, - input_device_index=self._find_system_audio_device(), - frames_per_buffer=self.chunk_size - ) - self.is_recording = True - print(f"Started system audio capture at {self.sample_rate}Hz") - except Exception as e: - print(f"Failed to start system audio capture: {e}") - # Fallback to default input device - self.stream = self.audio.open( - format=pyaudio.paInt16, - channels=self.channels, - rate=self.sample_rate, - input=True, - frames_per_buffer=self.chunk_size - ) - self.is_recording = True - print(f"Fell back to default audio input at {self.sample_rate}Hz") + """Initialize system audio capture (if sounddevice is available).""" + if not SOUNDDEVICE_AVAILABLE: + raise ImportError("sounddevice not available for system audio capture") + + # Find system audio device + self.device_info = self._find_system_audio_device() + if not self.device_info: + raise RuntimeError("No suitable system audio device found") + + print(f"Using system audio device: {self.device_info['name']}", file=sys.stderr) def _find_system_audio_device(self): - """Find a suitable system audio capture device.""" - try: - # List available devices - device_count = self.audio.get_device_count() - print(f"Found {device_count} audio devices:") - - for i in range(device_count): - device_info = 
self.audio.get_device_info_by_index(i) - name = device_info.get('name', 'Unknown') - max_inputs = device_info.get('maxInputChannels', 0) - print(f" Device {i}: {name} (inputs: {max_inputs})") - - # Look for loopback, monitor, or system audio devices - if (max_inputs > 0 and - any(keyword in name.lower() for keyword in - ['loopback', 'monitor', 'system', 'speaker', 'output'])): - print(f" Selected system audio device: {name}") - return i - - # If no specific system audio device found, try default - print("No specific system audio device found, using default") - return None - - except Exception as e: - print(f"Error finding system audio device: {e}") - return None + """Find a suitable system audio device.""" + devices = sd.query_devices() + + # Look for output devices that can be used for loopback + for device in devices: + if device['max_inputs'] > 0 and device['max_outputs'] > 0: + # This device supports both input and output (potential loopback) + return device + + # Fallback to default device + return sd.query_devices(kind='input') def get_system_audio_chunk(self): - """Get a chunk of system audio data.""" - if not self.is_recording or not self.stream: - raise RuntimeError("System audio stream not started") + """Get a single chunk of system audio.""" + if not SOUNDDEVICE_AVAILABLE: + raise ImportError("sounddevice not available") + + # Record a chunk of system audio + recording = sd.rec( + int(self.chunk_size), + samplerate=self.sample_rate, + channels=self.channels, + dtype='int16', + device=self.device_info['index'] + ) + sd.wait() - try: - # Read audio data - data = self.stream.read(self.chunk_size, exception_on_overflow=False) - - # Create audio chunk - chunk = AudioChunk( - data=data, - sample_rate=self.sample_rate, - channels=self.channels, - chunk_index=self.chunk_index, - timestamp=time.time() - ) - - self.chunk_index += 1 - return chunk - - except Exception as e: - print(f"Error reading system audio: {e}") - # Return silence on error - silence_data = b'\x00' * (self.chunk_size * 2) - chunk = AudioChunk( - data=silence_data, - sample_rate=self.sample_rate, - channels=self.channels, - chunk_index=self.chunk_index, - timestamp=time.time() - ) - self.chunk_index += 1 - return chunk + # Convert to bytes + data = recording.tobytes() + + return AudioChunk( + data=data, + sample_rate=self.sample_rate, + channels=self.channels, + chunk_index=0, + timestamp=time.time() + ) def audio_stream_source(data: Dict[str, Any], context=None): """ - Component that generates audio stream chunks using continuous background recording. + Component that generates audio stream chunks. 
Input: source: str - audio source type ("sine_wave", "microphone", "system_audio") @@ -529,48 +166,6 @@ def audio_stream_source(data: Dict[str, Any], context=None): Output: Streaming audio chunks with metadata """ - global _pipeline - - # Check if we should use the streaming pipeline - use_pipeline = data.get('use_pipeline', False) - - if use_pipeline and _pipeline is None: - # Start the streaming pipeline - _pipeline = StreamingPipeline() - - # Extract configs for each component - source_config = { - 'source': data.get('source', 'microphone'), - 'sample_rate': data.get('sample_rate', 16000), - 'channels': data.get('channels', 1), - 'chunk_size': data.get('chunk_size', 1024), - 'duration': data.get('duration', 5.0), - 'device_name': data.get('device_name', None), - 'frequency': data.get('frequency', 440.0) - } - - processor_config = { - 'operation': data.get('operation', 'passthrough'), - 'gain': data.get('gain', 2.0) - } - - sink_config = { - 'output_file': data.get('output_file', 'output_audio.wav') - } - - # Start the pipeline - _pipeline.start_pipeline(source_config, processor_config, sink_config) - - # Return a simple success response since the pipeline is running - return { - "outcome": "success", - "result": { - "message": "Streaming pipeline started", - "pipeline_id": str(uuid.uuid4()) - } - } - - # Fallback to the original implementation for non-pipeline mode import time start_time = time.time() From a4d19f5ba74420c11f22e2309772e6b8b9c15f5f Mon Sep 17 00:00:00 2001 From: phact Date: Tue, 24 Jun 2025 11:33:43 -0400 Subject: [PATCH 04/14] improve test script --- examples/test_audio_pipeline.sh | 69 ++++++++++++++++++++++++++++----- 1 file changed, 59 insertions(+), 10 deletions(-) diff --git a/examples/test_audio_pipeline.sh b/examples/test_audio_pipeline.sh index c173bbd2..5d72f5c5 100755 --- a/examples/test_audio_pipeline.sh +++ b/examples/test_audio_pipeline.sh @@ -2,45 +2,90 @@ # Audio Pipeline Test Script # Usage: ./test_audio_pipeline.sh [source] [operation] [duration] [output_file] [device_name] +# Can be run from either the examples directory or the repo root directory -SOURCE=${1:-"microphone"} -OPERATION=${2:-"amplify"} -DURATION=${3:-"3.0"} -OUTPUT_FILE=${4:-"test_workflow_webcam.wav"} -DEVICE_NAME=${5:-"C922 Pro Stream Webcam"} +set -e # Exit on any error -# Detect if we're running from examples directory or root +# Get script directory and current working directory SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)" CURRENT_DIR="$(pwd)" +# Determine if we're running from examples directory or root if [[ "$CURRENT_DIR" == "$SCRIPT_DIR" ]]; then # Running from examples directory INPUT_FILE="audio_input.json" FLOW_FILE="audio-streaming-pipeline.yaml" + CONFIG_FILE="stepflow-config.yml" INPUT_DIR="." + echo "📍 Running from examples directory" else # Running from root directory INPUT_FILE="examples/audio_input.json" FLOW_FILE="examples/audio-streaming-pipeline.yaml" + CONFIG_FILE="examples/stepflow-config.yml" INPUT_DIR="examples" + echo "📍 Running from repo root directory" +fi + +# Check if required files exist +if [[ ! -f "$INPUT_FILE" ]]; then + echo "❌ Error: Input file not found: $INPUT_FILE" + exit 1 +fi + +if [[ ! -f "$FLOW_FILE" ]]; then + echo "❌ Error: Flow file not found: $FLOW_FILE" + exit 1 +fi + +if [[ ! 
-f "$CONFIG_FILE" ]]; then + echo "❌ Error: Config file not found: $CONFIG_FILE" + exit 1 fi +# Parse command line arguments (all optional) +SOURCE=${1:-"microphone"} +OPERATION=${2:-"amplify"} +DURATION=${3:-"3.0"} +OUTPUT_FILE=${4:-"test_workflow_webcam.wav"} +DEVICE_NAME=${5:-"C922 Pro Stream Webcam"} + echo "🎵 Testing Audio Streaming Pipeline" echo "Source: $SOURCE" echo "Operation: $OPERATION" echo "Duration: ${DURATION}s" echo "Output: $OUTPUT_FILE" echo "Device: $DEVICE_NAME" -echo "Running from: $CURRENT_DIR" +echo "" + +# Create a temporary input file with the provided parameters +TEMP_INPUT=$(mktemp --suffix=.json) +cat > "$TEMP_INPUT" << EOF +{ + "source": "$SOURCE", + "operation": "$OPERATION", + "sample_rate": 44100, + "channels": 1, + "chunk_size": 1024, + "frequency": 440.0, + "duration": $DURATION, + "output_file": "$OUTPUT_FILE", + "device_name": "$DEVICE_NAME" +} +EOF + +echo "📝 Using input configuration:" +cat "$TEMP_INPUT" echo "" # Run the workflow +echo "🚀 Starting workflow execution..." if [[ "$CURRENT_DIR" == "$SCRIPT_DIR" ]]; then # Running from examples directory - run from current directory - cargo run -- run --flow audio-streaming-pipeline.yaml --input audio_input.json + cargo run -- run --flow "$FLOW_FILE" --input "$TEMP_INPUT" else # Running from root directory - cargo run -- run --flow examples/audio-streaming-pipeline.yaml --input examples/audio_input.json + cargo run -- run --flow "$FLOW_FILE" --input "$TEMP_INPUT" fi echo "" @@ -57,4 +102,8 @@ else echo "❌ Output file not found" fi -# Clean up input file +# Clean up temporary input file +rm -f "$TEMP_INPUT" + +echo "" +echo "🎉 Audio pipeline test finished!" From 1bc5c2927fbccb95984e318b8fea3c1af2f79aed Mon Sep 17 00:00:00 2001 From: phact Date: Tue, 24 Jun 2025 12:39:48 -0400 Subject: [PATCH 05/14] persist step state and exit condition --- .../src/workflow_executor.rs | 185 +++++++++++++++++- 1 file changed, 175 insertions(+), 10 deletions(-) diff --git a/crates/stepflow-execution/src/workflow_executor.rs b/crates/stepflow-execution/src/workflow_executor.rs index b3eb1ea2..24fd0782 100644 --- a/crates/stepflow-execution/src/workflow_executor.rs +++ b/crates/stepflow-execution/src/workflow_executor.rs @@ -160,6 +160,23 @@ impl WorkflowExecutor { // Update tracker and store result let newly_unblocked = self.tracker.complete_step(completed_step_index); + // Update step status based on result + let final_status = match &step_result { + FlowResult::Success { .. } => stepflow_core::status::StepStatus::Completed, + FlowResult::Failed { .. } => stepflow_core::status::StepStatus::Failed, + FlowResult::Skipped => stepflow_core::status::StepStatus::Skipped, + FlowResult::Streaming { .. 
} => stepflow_core::status::StepStatus::Running, // Keep as running for streaming + }; + + self.state_store + .update_step_status( + self.context.execution_id(), + completed_step_index, + final_status, + ) + .await + .change_context_lazy(|| ExecutionError::StateError)?; + // Record the completed result in the state store let step_id = &self.flow.steps[completed_step_index].id; tracing::debug!( @@ -311,7 +328,18 @@ impl WorkflowExecutor { })?; // Keep executing until the target step is runnable or completed + let max_iterations = 1000; // Safety limit to prevent infinite loops + let mut iteration_count = 0; + loop { + iteration_count += 1; + if iteration_count > max_iterations { + tracing::error!("execute_until_runnable exceeded maximum iterations ({}), stopping execution", max_iterations); + return Err(ExecutionError::StepFailed { + step: format!("execute_until_runnable for {}", target_step_id) + }.into()); + } + let runnable = self.tracker.unblocked_steps(); // Check if target step is runnable @@ -433,10 +461,31 @@ impl WorkflowExecutor { .into()); } + // Update step status to Running + self.state_store + .update_step_status( + self.context.execution_id(), + step_index, + stepflow_core::status::StepStatus::Running, + ) + .await + .change_context_lazy(|| ExecutionError::StateError)?; + // Check skip condition if present if let Some(skip_if) = &step.skip_if { if self.should_skip_step(skip_if).await? { let result = FlowResult::Skipped; + + // Update step status to Skipped + self.state_store + .update_step_status( + self.context.execution_id(), + step_index, + stepflow_core::status::StepStatus::Skipped, + ) + .await + .change_context_lazy(|| ExecutionError::StateError)?; + self.record_step_completion(step_index, &result).await?; return Ok(StepExecutionResult::new( step_index, @@ -470,6 +519,23 @@ impl WorkflowExecutor { let plugin = self.executor.get_plugin(&step.component).await?; let result = execute_step_async(plugin, step, step_input, self.context.clone()).await?; + // Update step status based on result + let final_status = match &result { + FlowResult::Success { .. } => stepflow_core::status::StepStatus::Completed, + FlowResult::Failed { .. } => stepflow_core::status::StepStatus::Failed, + FlowResult::Skipped => stepflow_core::status::StepStatus::Skipped, + FlowResult::Streaming { .. 
} => stepflow_core::status::StepStatus::Running, // Keep as running for streaming + }; + + self.state_store + .update_step_status( + self.context.execution_id(), + step_index, + final_status, + ) + .await + .change_context_lazy(|| ExecutionError::StateError)?; + // For streaming steps, don't record in state store if step.streaming { // Update dependency tracker but don't persist @@ -626,6 +692,16 @@ impl WorkflowExecutor { let newly_unblocked_from_skip = self.tracker.complete_step(step_index); let skip_result = FlowResult::Skipped; + // Update step status to Skipped + self.state_store + .update_step_status( + self.context.execution_id(), + step_index, + stepflow_core::status::StepStatus::Skipped, + ) + .await + .change_context_lazy(|| ExecutionError::StateError)?; + // Record the skipped result in the state store self.state_store .record_step_result( @@ -658,6 +734,16 @@ impl WorkflowExecutor { let step = &self.flow.steps[step_index]; tracing::debug!("Starting execution of step {}", step.id); + // Update step status to Running + self.state_store + .update_step_status( + self.context.execution_id(), + step_index, + stepflow_core::status::StepStatus::Running, + ) + .await + .change_context_lazy(|| ExecutionError::StateError)?; + // Get plugin for this step let plugin = self.executor.get_plugin(&step.component).await?; @@ -742,6 +828,16 @@ impl WorkflowExecutor { tracing::info!("Executing streaming pipeline step: {}", step_id); + // Update step status to Running + self.state_store + .update_step_status( + self.context.execution_id(), + step_index, + stepflow_core::status::StepStatus::Running, + ) + .await + .change_context_lazy(|| ExecutionError::StateError)?; + // Find all streaming steps in the pipeline let pipeline_steps = self.find_streaming_pipeline_steps(step_index); @@ -755,7 +851,33 @@ impl WorkflowExecutor { self.streaming_coordinator = Some(coordinator.clone()); // Execute the entire pipeline - coordinator.lock().await.execute_pipeline().await?; + let pipeline_result = coordinator.lock().await.execute_pipeline().await; + + match pipeline_result { + Ok(_) => { + // Update step status to Completed + self.state_store + .update_step_status( + self.context.execution_id(), + step_index, + stepflow_core::status::StepStatus::Completed, + ) + .await + .change_context_lazy(|| ExecutionError::StateError)?; + } + Err(e) => { + // Update step status to Failed + self.state_store + .update_step_status( + self.context.execution_id(), + step_index, + stepflow_core::status::StepStatus::Failed, + ) + .await + .change_context_lazy(|| ExecutionError::StateError)?; + return Err(e); + } + } // Update dependency tracker self.tracker.complete_step(step_index); @@ -807,6 +929,16 @@ impl WorkflowExecutor { let step = &self.flow.steps[step_index]; let step_id = step.id.clone(); + // Update step status to Running + self.state_store + .update_step_status( + self.context.execution_id(), + step_index, + stepflow_core::status::StepStatus::Running, + ) + .await + .change_context_lazy(|| ExecutionError::StateError)?; + // Resolve step inputs let step_input = match self.resolver.resolve(&step.input).await? 
{ FlowResult::Success { result } => result, @@ -831,6 +963,7 @@ impl WorkflowExecutor { // Execute streaming step in a loop let mut chunk_index = 0; + loop { let result = execute_step_async(plugin.clone(), step, step_input.clone(), self.context.clone()).await?; @@ -858,6 +991,17 @@ impl WorkflowExecutor { } FlowResult::Failed { error } => { tracing::error!("Streaming step {} failed: {:?}", step_id, error); + + // Update step status to Failed + self.state_store + .update_step_status( + self.context.execution_id(), + step_index, + stepflow_core::status::StepStatus::Failed, + ) + .await + .change_context_lazy(|| ExecutionError::StateError)?; + return Err(ExecutionError::StepFailed { step: step_id }.into()); } FlowResult::Skipped => { @@ -867,6 +1011,16 @@ impl WorkflowExecutor { } } + // Update step status to Completed + self.state_store + .update_step_status( + self.context.execution_id(), + step_index, + stepflow_core::status::StepStatus::Completed, + ) + .await + .change_context_lazy(|| ExecutionError::StateError)?; + // Update dependency tracker for streaming step self.tracker.complete_step(step_index); @@ -1198,15 +1352,26 @@ impl StreamingPipelineCoordinator { // Continue processing if not final if !is_final { - // Wait for input from upstream steps - while let Some(input_chunk) = receiver.recv().await { - // Process the input chunk and continue streaming - // This is where you'd call the step again with the new input - tracing::debug!("Step {} received chunk, continuing stream", step_id); - - // For now, just continue the loop - // In a full implementation, you'd call the step again - break; + // Wait for input from upstream steps with a timeout + // This prevents infinite hanging if no chunks are sent + let timeout = tokio::time::Duration::from_secs(30); // 30 second timeout + match tokio::time::timeout(timeout, receiver.recv()).await { + Ok(Some(input_chunk)) => { + // Process the input chunk and continue streaming + tracing::debug!("Step {} received chunk, continuing stream", step_id); + + // For now, just log the chunk and continue + // In a full implementation, you'd call the step again with the new input + tracing::debug!("Step {} processing chunk: {:?}", step_id, input_chunk); + } + Ok(None) => { + // Channel closed, no more input expected + tracing::debug!("Step {} input channel closed", step_id); + } + Err(_) => { + // Timeout reached, no input received + tracing::warn!("Step {} timed out waiting for input chunks", step_id); + } } } } From 77bac8250ae36fe427ccfe08e179bfee3bf095b3 Mon Sep 17 00:00:00 2001 From: phact Date: Tue, 24 Jun 2025 12:52:09 -0400 Subject: [PATCH 06/14] script file detection fix --- examples/test_audio_pipeline.sh | 38 ++++++++++++++++++++++++++------- 1 file changed, 30 insertions(+), 8 deletions(-) diff --git a/examples/test_audio_pipeline.sh b/examples/test_audio_pipeline.sh index 5d72f5c5..6a6d16df 100755 --- a/examples/test_audio_pipeline.sh +++ b/examples/test_audio_pipeline.sh @@ -50,11 +50,21 @@ DURATION=${3:-"3.0"} OUTPUT_FILE=${4:-"test_workflow_webcam.wav"} DEVICE_NAME=${5:-"C922 Pro Stream Webcam"} +# Determine the absolute path for the output file +# The Python SDK runs from the examples directory, so it will create the file there +if [[ "$CURRENT_DIR" == "$SCRIPT_DIR" ]]; then + # Running from examples directory + ABSOLUTE_OUTPUT_FILE="$CURRENT_DIR/$OUTPUT_FILE" +else + # Running from root directory + ABSOLUTE_OUTPUT_FILE="$SCRIPT_DIR/$OUTPUT_FILE" +fi + echo "🎵 Testing Audio Streaming Pipeline" echo "Source: $SOURCE" echo "Operation: 
$OPERATION"
 echo "Duration: ${DURATION}s"
-echo "Output: $OUTPUT_FILE"
+echo "Output: $ABSOLUTE_OUTPUT_FILE"
 echo "Device: $DEVICE_NAME"
 echo ""
 
@@ -69,7 +79,7 @@ cat > "$TEMP_INPUT" << EOF
   "chunk_size": 1024,
   "frequency": 440.0,
   "duration": $DURATION,
-  "output_file": "$OUTPUT_FILE",
+  "output_file": "$ABSOLUTE_OUTPUT_FILE",
   "device_name": "$DEVICE_NAME"
 }
 EOF
@@ -90,16 +100,28 @@ fi
 
 echo ""
 echo "✅ Test completed!"
-echo "📁 Output file: $OUTPUT_FILE"
+echo "📁 Output file: $ABSOLUTE_OUTPUT_FILE"
 
 # Check if file was created
-if [ -f "$OUTPUT_FILE" ]; then
+if [ -f "$ABSOLUTE_OUTPUT_FILE" ]; then
     echo "📊 File info:"
-    file "$OUTPUT_FILE"
-    echo "📏 File size: $(ls -lh $OUTPUT_FILE | awk '{print $5}')"
-    echo "🎵 Duration: $(soxi -D $OUTPUT_FILE 2>/dev/null || echo 'Unknown') seconds"
+    file "$ABSOLUTE_OUTPUT_FILE"
+    echo "📏 File size: $(ls -lh $ABSOLUTE_OUTPUT_FILE | awk '{print $5}')"
+    echo "🎵 Duration: $(soxi -D $ABSOLUTE_OUTPUT_FILE 2>/dev/null || echo 'Unknown') seconds"
 else
-    echo "❌ Output file not found"
+    # Check if file was created in examples directory (where Python SDK runs from)
+    EXAMPLES_OUTPUT_FILE="examples/$OUTPUT_FILE"
+    if [ -f "$EXAMPLES_OUTPUT_FILE" ]; then
+        echo "📊 File found in examples directory:"
+        file "$EXAMPLES_OUTPUT_FILE"
+        echo "📏 File size: $(ls -lh $EXAMPLES_OUTPUT_FILE | awk '{print $5}')"
+        echo "🎵 Duration: $(soxi -D $EXAMPLES_OUTPUT_FILE 2>/dev/null || echo 'Unknown') seconds"
+        echo "💡 Note: File was created in examples/ directory by the Python SDK"
+    else
+        echo "❌ Output file not found in expected location: $ABSOLUTE_OUTPUT_FILE"
+        echo "🔍 Checking for any .wav files in examples/ directory:"
+        find examples/ -name "*.wav" -type f 2>/dev/null || echo "No .wav files found in examples/"
+    fi
 fi
 
 # Clean up temporary input file

From e16461402ccdd3ccb2787c35c1576bfe3a3cef9f Mon Sep 17 00:00:00 2001
From: phact
Date: Tue, 24 Jun 2025 12:52:17 -0400
Subject: [PATCH 07/14] use channel not notification

---
 .../src/workflow_executor.rs                  | 117 ++++++++++++++----
 .../src/stdio/recv_message_loop.rs            |  43 ++++++-
 2 files changed, 134 insertions(+), 26 deletions(-)

diff --git a/crates/stepflow-execution/src/workflow_executor.rs b/crates/stepflow-execution/src/workflow_executor.rs
index 24fd0782..c43714e6 100644
--- a/crates/stepflow-execution/src/workflow_executor.rs
+++ b/crates/stepflow-execution/src/workflow_executor.rs
@@ -1059,14 +1059,31 @@ impl WorkflowExecutor {
             return Ok(());
         }
 
-        // Route the chunk to the first streaming step (source step)
-        // In a more sophisticated implementation, we'd route based on stream_id
-        if let Some(first_step_index) = streaming_steps.first() {
-            if let Some(coordinator) = &self.streaming_coordinator {
-                let mut coordinator = coordinator.lock().await;
-                coordinator.route_chunk_to_step(*first_step_index, chunk_content).await?;
-                tracing::debug!("Routed chunk to streaming step {}", first_step_index);
+        // Route the chunk to the pipeline coordinator if it exists
+        if let Some(coordinator) = &self.streaming_coordinator {
+            let mut coordinator = coordinator.lock().await;
+
+            // Convert the notification chunk to a FlowResult::Streaming
+            let flow_result = FlowResult::Streaming {
+                stream_id: request_id.to_string(),
+                metadata: stepflow_core::workflow::ValueRef::new(serde_json::json!({})),
+                chunk: chunk_content.to_string(),
+                chunk_index: 0, // We don't have chunk index from notifications
+                is_final: false, // We don't know if it's final from notifications
+            };
+
+            // Route to all active streaming steps in the pipeline
+            for &step_index 
in &streaming_steps { + if let Some(sender) = coordinator.step_connections.get(&step_index) { + if let Err(e) = sender.send(flow_result.clone()).await { + tracing::warn!("Failed to send chunk to step {}: {:?}", step_index, e); + } else { + tracing::debug!("Successfully routed chunk to streaming step {}", step_index); + } + } } + } else { + tracing::warn!("No streaming coordinator found for chunk routing"); } Ok(()) @@ -1258,6 +1275,7 @@ impl StreamingPipelineCoordinator { } // Wait for all streaming steps to complete + // Since streaming steps don't wait for input chunks anymore, they should complete quickly for task in tasks { task.await.map_err(|_e| ExecutionError::StepFailed { step: "streaming_pipeline".to_string() @@ -1334,8 +1352,15 @@ impl StreamingPipelineCoordinator { tracing::info!("Starting streaming step: {}", step_id); - // Execute the step to get initial result - let result = execute_step_async(plugin, step, step_input, context).await?; + // Execute the step to get initial result with a timeout + let timeout_duration = std::time::Duration::from_secs(10); + let result = match tokio::time::timeout(timeout_duration, execute_step_async(plugin.clone(), step, step_input.clone(), context.clone())).await { + Ok(result) => result?, + Err(_) => { + tracing::error!("Streaming step {} timed out after {} seconds", step_id, timeout_duration.as_secs()); + return Err(ExecutionError::StepFailed { step: step_id }.into()); + } + }; match result { FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { @@ -1350,30 +1375,72 @@ impl StreamingPipelineCoordinator { }).await; } - // Continue processing if not final - if !is_final { - // Wait for input from upstream steps with a timeout - // This prevents infinite hanging if no chunks are sent - let timeout = tokio::time::Duration::from_secs(30); // 30 second timeout - match tokio::time::timeout(timeout, receiver.recv()).await { - Ok(Some(input_chunk)) => { - // Process the input chunk and continue streaming - tracing::debug!("Step {} received chunk, continuing stream", step_id); + tracing::info!("Streaming step {} processed initial chunk, waiting for additional chunks", step_id); + + // Now wait for additional chunks to come through the channel + // These chunks are routed from the notification system + let mut chunk_count = 1; + let max_chunks = 1000; // Safety limit + + while chunk_count < max_chunks { + // Wait for chunks with a timeout + match tokio::time::timeout(std::time::Duration::from_secs(5), receiver.recv()).await { + Ok(Some(FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final })) => { + chunk_count += 1; + tracing::debug!("Streaming step {} received chunk {}: stream_id={}, is_final={}", + step_id, chunk_count, stream_id, is_final); + + // Process the chunk by calling the step again + let chunk_input = stepflow_core::workflow::ValueRef::new(serde_json::json!({ + "chunk": chunk, + "stream_id": stream_id, + "chunk_index": chunk_index, + "is_final": is_final, + "metadata": metadata.as_ref() + })); + + let chunk_result = match tokio::time::timeout( + std::time::Duration::from_secs(5), + execute_step_async(plugin.clone(), step, chunk_input, context.clone()) + ).await { + Ok(result) => result?, + Err(_) => { + tracing::warn!("Streaming step {} chunk processing timed out", step_id); + continue; + } + }; - // For now, just log the chunk and continue - // In a full implementation, you'd call the step again with the new input - tracing::debug!("Step {} processing chunk: {:?}", step_id, input_chunk); + // 
Send the processed chunk to downstream steps + for sender in &downstream_senders { + let _ = sender.send(chunk_result.clone()).await; + } + + // If this is the final chunk, we're done + if is_final { + tracing::info!("Streaming step {} received final chunk, completing", step_id); + break; + } + } + Ok(Some(_)) => { + // Received non-streaming result, ignore + continue; } Ok(None) => { - // Channel closed, no more input expected - tracing::debug!("Step {} input channel closed", step_id); + // Channel closed, we're done + tracing::info!("Streaming step {} channel closed, completing", step_id); + break; } Err(_) => { - // Timeout reached, no input received - tracing::warn!("Step {} timed out waiting for input chunks", step_id); + // Timeout - no more chunks for now + tracing::debug!("Streaming step {} no more chunks after timeout", step_id); + break; } } } + + if chunk_count >= max_chunks { + tracing::warn!("Streaming step {} reached maximum chunk limit ({})", step_id, max_chunks); + } } FlowResult::Success { result } => { tracing::info!("Streaming step {} completed with success", step_id); diff --git a/crates/stepflow-protocol/src/stdio/recv_message_loop.rs b/crates/stepflow-protocol/src/stdio/recv_message_loop.rs index b296535e..ab4d2809 100644 --- a/crates/stepflow-protocol/src/stdio/recv_message_loop.rs +++ b/crates/stepflow-protocol/src/stdio/recv_message_loop.rs @@ -33,6 +33,8 @@ impl ReceiveMessageLoop { let to_child = child.stdin.take().expect("stdin requested"); let from_child_stdout = child.stdout.take().expect("stdout requested"); + + // Use BufReader with default capacity - it will automatically handle large messages let from_child_stdout = LinesStream::new(BufReader::new(from_child_stdout).lines()); let from_child_stderr = child.stderr.take().expect("stderr requested"); @@ -92,8 +94,47 @@ impl ReceiveMessageLoop { } Some(line) = self.from_child_stdout.next() => { let line = line.change_context(StdioError::Recv)?; + + // Check if the line is suspiciously long (might indicate truncation) + if line.len() > 1024 * 1024 { + tracing::warn!("Received very long message ({} chars), may be truncated", line.len()); + } + tracing::info!("Received line from child: {line:?}"); - let msg = OwnedIncoming::try_new(line).change_context(StdioError::Recv)?; + + // Add better error handling for JSON parsing + let msg = match OwnedIncoming::try_new(line.clone()) { + Ok(msg) => msg, + Err(e) => { + tracing::error!("Failed to parse JSON message: {}", e); + tracing::error!("Message length: {} characters", line.len()); + + // Check if the JSON appears to be truncated + if !line.trim().ends_with('}') { + tracing::error!("JSON appears to be truncated - doesn't end with '}}'"); + } + + // Check for common JSON syntax issues + let open_braces = line.chars().filter(|&c| c == '{').count(); + let close_braces = line.chars().filter(|&c| c == '}').count(); + if open_braces != close_braces { + tracing::error!("JSON brace mismatch: {} opening, {} closing", open_braces, close_braces); + } + + if line.len() > 1000 { + tracing::error!("Message preview (first 500 chars): {}", &line[..500]); + tracing::error!("Message preview (last 500 chars): {}", &line[line.len()-500..]); + } else { + tracing::error!("Full message: {}", line); + } + + // Instead of returning an error and terminating the loop, + // log the error and continue processing other messages + tracing::warn!("Skipping malformed message and continuing..."); + return Ok(true); + } + }; + match (msg.method, msg.params, msg.id) { (Some(method), Some(params), _) => 
{ // Incoming method call or notification. From f9950ccae0674353ab5868a5c676ea5704ffa406 Mon Sep 17 00:00:00 2001 From: phact Date: Thu, 26 Jun 2025 00:18:55 -0400 Subject: [PATCH 08/14] wip --- Cargo.lock | 1 + crates/stepflow-core/src/flow_result.rs | 6 + crates/stepflow-core/src/workflow/step.rs | 2 +- crates/stepflow-execution/src/executor.rs | 78 +- .../stepflow-execution/src/value_resolver.rs | 5 + .../src/workflow_executor.rs | 1066 ++++++++++++----- crates/stepflow-plugin/src/context.rs | 14 + crates/stepflow-protocol/Cargo.toml | 1 + crates/stepflow-protocol/src/blob_handlers.rs | 78 +- .../stepflow-protocol/src/incoming_handler.rs | 3 + .../src/schema/component_execute.rs | 3 + crates/stepflow-protocol/src/stdio/client.rs | 1 + crates/stepflow-protocol/src/stdio/plugin.rs | 99 +- .../src/stdio/recv_message_loop.rs | 143 ++- examples/audio-streaming-pipeline.yaml | 7 +- examples/audio_input.json | 2 +- examples/test_audio_pipeline.sh | 29 +- .../src/stepflow_sdk/audio_components.py | 403 ++++--- sdks/python/src/stepflow_sdk/protocol.py | 2 + sdks/python/src/stepflow_sdk/server.py | 33 +- 20 files changed, 1451 insertions(+), 525 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index 06e10894..720ea251 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -3020,6 +3020,7 @@ dependencies = [ "serde", "serde_json", "stepflow-core", + "stepflow-execution", "stepflow-plugin", "thiserror 2.0.12", "tokio", diff --git a/crates/stepflow-core/src/flow_result.rs b/crates/stepflow-core/src/flow_result.rs index 5c6af92d..8d564b80 100644 --- a/crates/stepflow-core/src/flow_result.rs +++ b/crates/stepflow-core/src/flow_result.rs @@ -70,6 +70,12 @@ pub enum FlowResult { impl From for FlowResult { fn from(value: serde_json::Value) -> Self { + // First try to deserialize as a proper FlowResult + if let Ok(flow_result) = serde_json::from_value::(value.clone()) { + return flow_result; + } + + // If that fails, wrap in Success as fallback let result = ValueRef::new(value); Self::Success { result } } diff --git a/crates/stepflow-core/src/workflow/step.rs b/crates/stepflow-core/src/workflow/step.rs index a529ad7e..14829f67 100644 --- a/crates/stepflow-core/src/workflow/step.rs +++ b/crates/stepflow-core/src/workflow/step.rs @@ -3,7 +3,7 @@ use crate::schema::SchemaRef; use schemars::JsonSchema; /// A step in a workflow that executes a component with specific arguments. -#[derive(serde::Serialize, serde::Deserialize, Debug, PartialEq, JsonSchema, utoipa::ToSchema)] +#[derive(Clone, serde::Serialize, serde::Deserialize, Debug, PartialEq, JsonSchema, utoipa::ToSchema)] #[serde(rename_all = "camelCase")] pub struct Step { /// Optional identifier for the step diff --git a/crates/stepflow-execution/src/executor.rs b/crates/stepflow-execution/src/executor.rs index a28ec5ed..463e7cb2 100644 --- a/crates/stepflow-execution/src/executor.rs +++ b/crates/stepflow-execution/src/executor.rs @@ -11,7 +11,7 @@ use stepflow_core::{ }; use stepflow_plugin::{Context, DynPlugin, ExecutionContext, Plugin as _}; use stepflow_state::{InMemoryStateStore, StateStore}; -use tokio::sync::{RwLock, oneshot}; +use tokio::sync::{RwLock, oneshot, Mutex}; use uuid::Uuid; type FutureFlowResult = futures::future::Shared>; @@ -25,7 +25,7 @@ pub struct StepFlowExecutor { // TODO: Should write execution state to the state store for persistence. 
pending: Arc>>, /// Active debug sessions for step-by-step execution control - debug_sessions: Arc>>, + debug_sessions: Arc>>>>, // Keep a weak reference to self for spawning tasks without circular references self_weak: std::sync::Weak, } @@ -155,20 +155,11 @@ impl StepFlowExecutor { pub async fn get_workflow_executor( &self, execution_id: Uuid, - ) -> Result> { + ) -> Result>>> { let debug_sessions = self.debug_sessions.read().await; Ok(debug_sessions.get(&execution_id).cloned()) } - /// Get a mutable workflow executor for debug sessions - pub async fn get_workflow_executor_mut( - &self, - execution_id: Uuid, - ) -> Result> { - let mut debug_sessions = self.debug_sessions.write().await; - Ok(debug_sessions.get_mut(&execution_id).cloned()) - } - /// Get the flow for a specific execution (for streaming pipeline coordinator) pub fn flow(&self) -> Option> { // This is a placeholder - in a real implementation, we'd need to store flows @@ -208,18 +199,38 @@ impl Context for StepFlowExecutor { pending.insert(execution_id, rx.shared()); } + // Create the WorkflowExecutor and store it in debug_sessions for streaming access + // TODO: Consider using a separate `active_executions` map instead of `debug_sessions` + // for normal execution, to keep debug sessions separate from streaming access + let workflow_executor = WorkflowExecutor::new( + executor.clone(), + flow.clone(), + workflow_hash.clone(), + execution_id, + input.clone(), + executor.state_store().clone(), + ).map_err(|e| stepflow_plugin::PluginError::new(format!("Failed to create workflow executor: {:?}", e))) + .change_context(stepflow_plugin::PluginError::new("Failed to create workflow executor"))?; + + // Store in debug_sessions for streaming chunk access + { + let mut debug_sessions = self.debug_sessions.write().await; + debug_sessions.insert(execution_id, Arc::new(Mutex::new(workflow_executor))); + tracing::info!("Stored WorkflowExecutor in debug_sessions for execution ID: {}", execution_id); + } + // Spawn the execution tokio::spawn(async move { tracing::info!("Executing workflow using tracker-based execution"); let state_store = executor.state_store.clone(); let result = execute_workflow( - executor, - flow, + executor.clone(), + flow.clone(), workflow_hash, execution_id, input, - state_store, + state_store.clone(), ) .await; @@ -242,6 +253,14 @@ impl Context for StepFlowExecutor { // Send the result back let _ = tx.send(flow_result); + + // Clean up the debug session immediately after execution completes + // This prevents unbounded growth of the debug_sessions map + { + let mut debug_sessions = executor.debug_sessions.write().await; + debug_sessions.remove(&execution_id); + tracing::debug!("Cleaned up debug session for execution {}", execution_id); + } }); Ok(execution_id) @@ -265,15 +284,26 @@ impl Context for StepFlowExecutor { let pending = self.pending.clone(); async move { - let pending = pending.read().await; - let future = pending - .get(&execution_id) - .ok_or_else(|| stepflow_plugin::PluginError::new("Execution not found")) - .change_context(stepflow_plugin::PluginError::new("Execution not found"))? - .clone(); - - future.await.map_err(|_| stepflow_plugin::PluginError::new("Execution failed")) - .change_context(stepflow_plugin::PluginError::new("Execution failed")) + let future = { + let pending = pending.read().await; + pending + .get(&execution_id) + .ok_or_else(|| stepflow_plugin::PluginError::new("Execution not found")) + .change_context(stepflow_plugin::PluginError::new("Execution not found"))? 
+ .clone() + }; + + let result = future.await.map_err(|_| stepflow_plugin::PluginError::new("Execution failed")) + .change_context(stepflow_plugin::PluginError::new("Execution failed")); + + // Clean up the pending entry after getting the result to prevent memory leaks + { + let mut pending_write = pending.write().await; + pending_write.remove(&execution_id); + tracing::debug!("Cleaned up pending execution {}", execution_id); + } + + result } .boxed() } diff --git a/crates/stepflow-execution/src/value_resolver.rs b/crates/stepflow-execution/src/value_resolver.rs index cdb804f9..f11af293 100644 --- a/crates/stepflow-execution/src/value_resolver.rs +++ b/crates/stepflow-execution/src/value_resolver.rs @@ -35,6 +35,11 @@ impl ValueResolver { } } + /// Get the workflow input for this resolver. + pub fn workflow_input(&self) -> &ValueRef { + &self.input + } + /// Resolve a ValueRef, returning a FlowResult. /// This is the main entry point for value resolution. pub async fn resolve(&self, value: &ValueRef) -> Result { diff --git a/crates/stepflow-execution/src/workflow_executor.rs b/crates/stepflow-execution/src/workflow_executor.rs index c43714e6..e487cec0 100644 --- a/crates/stepflow-execution/src/workflow_executor.rs +++ b/crates/stepflow-execution/src/workflow_executor.rs @@ -12,10 +12,17 @@ use stepflow_core::{ use stepflow_plugin::{DynPlugin, ExecutionContext, Plugin as _}; use stepflow_state::{StateStore, StepResult}; use uuid::Uuid; -use tokio::sync::{mpsc, oneshot}; +use tokio::sync::mpsc; use crate::{ExecutionError, Result, StepFlowExecutor, value_resolver::ValueResolver}; +/// Helper macro for streaming step logging +macro_rules! stream_log { + ($level:ident, $step_id:expr, $($arg:tt)*) => { + tracing::$level!("[STREAM {}] {}", $step_id, format!($($arg)*)) + }; +} + /// Execute a workflow and return the result. pub(crate) async fn execute_workflow( executor: Arc, @@ -41,7 +48,6 @@ pub(crate) async fn execute_workflow( /// /// This serves as the core execution engine that can be used directly for /// run-to-completion execution, or controlled step-by-step by the debug session. 
-#[derive(Clone)] pub struct WorkflowExecutor { /// Dependency tracker for determining runnable steps tracker: stepflow_analysis::DependencyTracker, @@ -56,7 +62,7 @@ pub struct WorkflowExecutor { /// Execution context for this session context: ExecutionContext, /// Optional streaming pipeline coordinator - streaming_coordinator: Option>>, + streaming_coordinator: Option>>, } impl WorkflowExecutor { @@ -85,20 +91,37 @@ impl WorkflowExecutor { // Initialize streaming coordinator if workflow has streaming steps let streaming_coordinator = if flow.steps.iter().any(|step| step.streaming) { - let pipeline_steps: Vec = flow.steps.iter() + let mut pipeline_steps: Vec = flow.steps.iter() .enumerate() .filter(|(_, step)| step.streaming) .map(|(index, _)| index) .collect(); if !pipeline_steps.is_empty() { + // Log the initial order (source order) + tracing::info!("Initial pipeline order (source order): {:?}", + pipeline_steps.iter().map(|i| &flow.steps[*i].id).collect::>() + ); + + // Sort pipeline steps by dependencies using a topological sort + pipeline_steps = sort_streaming_steps_by_dependencies(&flow, pipeline_steps)?; + + // Log the final pipeline order to verify it's correct + tracing::info!("Final pipeline will run in this order: {:?}", + pipeline_steps.iter().map(|i| &flow.steps[*i].id).collect::>() + ); + tracing::info!("Pipeline step indices and components: {:?}", + pipeline_steps.iter().map(|i| (*i, &flow.steps[*i].id, &flow.steps[*i].component)).collect::>() + ); + let coordinator = StreamingPipelineCoordinator::new( executor.clone(), flow.clone(), pipeline_steps, context.clone(), + resolver.clone(), ); - Some(std::sync::Arc::new(tokio::sync::Mutex::new(coordinator))) + Some(Arc::new(tokio::sync::Mutex::new(coordinator))) } else { None } @@ -127,6 +150,17 @@ impl WorkflowExecutor { &self.flow } + /// Check if the streaming pipeline is still active (has active receivers) + pub fn is_streaming_pipeline_active(&self) -> bool { + if let Some(coord_arc) = &self.streaming_coordinator { + // For now, just check if coordinator exists - we can't easily check receivers without async + true + } else { + // No coordinator means no streaming pipeline + false + } + } + /// Get currently runnable step indices. 
pub fn get_runnable_step_indices(&self) -> BitSet { self.tracker.unblocked_steps() @@ -139,6 +173,19 @@ impl WorkflowExecutor { tracing::debug!("Starting execution of {} steps", self.flow.steps.len()); + // Start streaming pipeline coordinator concurrently if it exists + let streaming_task = if let Some(coordinator_arc) = &self.streaming_coordinator { + tracing::info!("Starting streaming pipeline coordinator concurrently with main execution"); + + let coord = coordinator_arc.clone(); + // Start the pipeline execution in a separate task (single-phase, no setup needed) + Some(tokio::spawn(async move { + StreamingPipelineCoordinator::run_pipeline_without_lock(coord).await + })) + } else { + None + }; + // Start initial unblocked steps let initial_unblocked = self.tracker.unblocked_steps(); tracing::debug!( @@ -201,7 +248,23 @@ impl WorkflowExecutor { .await?; } - // All tasks completed - try to complete the workflow + // Wait for streaming pipeline to complete if it was started + if let Some(streaming_task) = streaming_task { + tracing::info!("Waiting for streaming pipeline coordinator to complete"); + match streaming_task.await { + Ok(result) => { + if let Err(e) = result { + tracing::warn!("Streaming pipeline coordinator completed with error: {:?}", e); + } else { + tracing::info!("Streaming pipeline coordinator completed successfully"); + } + } + Err(e) => { + tracing::warn!("Streaming pipeline coordinator task panicked: {:?}", e); + } + } + } + self.resolve_workflow_output().await } @@ -515,36 +578,36 @@ impl WorkflowExecutor { } }; - // Get plugin and execute the step - let plugin = self.executor.get_plugin(&step.component).await?; - let result = execute_step_async(plugin, step, step_input, self.context.clone()).await?; - - // Update step status based on result - let final_status = match &result { - FlowResult::Success { .. } => stepflow_core::status::StepStatus::Completed, - FlowResult::Failed { .. } => stepflow_core::status::StepStatus::Failed, - FlowResult::Skipped => stepflow_core::status::StepStatus::Skipped, - FlowResult::Streaming { .. 
} => stepflow_core::status::StepStatus::Running, // Keep as running for streaming - }; - - self.state_store - .update_step_status( - self.context.execution_id(), - step_index, - final_status, - ) - .await - .change_context_lazy(|| ExecutionError::StateError)?; - - // For streaming steps, don't record in state store + // Check if this is a streaming step if step.streaming { - // Update dependency tracker but don't persist - self.tracker.complete_step(step_index); - } else { - // Record the result for non-streaming steps - self.record_step_completion(step_index, &result).await?; + tracing::info!("Step {} is a streaming step, using streaming execution", step.id); + // For streaming steps, return a StepExecutionResult with a placeholder Streaming result + let streaming_result = FlowResult::Streaming { + stream_id: format!("stream_{}", step.id), + metadata: stepflow_core::workflow::ValueRef::new(serde_json::json!({ + "step_id": step.id, + "step_index": step_index, + "streaming": true + })), + chunk: "".to_string(), + chunk_index: 0, + is_final: false, + }; + return Ok(StepExecutionResult::new( + step_index, + step_id, + component_string, + streaming_result, + )); } + // Regular non-streaming step execution + let plugin = self.executor.get_plugin(&step.component).await?; + let flow = self.flow.clone(); + let context = self.context.clone() + .with_step(self.flow.steps[step_index].id.clone()); + let step = &flow.steps[step_index]; + let result = execute_step_async(plugin, step, step_input, context).await?; Ok(StepExecutionResult::new( step_index, step_id, @@ -744,17 +807,25 @@ impl WorkflowExecutor { .await .change_context_lazy(|| ExecutionError::StateError)?; - // Get plugin for this step + // Check if this is a streaming step + if step.streaming { + tracing::info!("Step {} is a streaming step, using streaming execution", step.id); + // For streaming steps, just mark as running; the coordinator will handle execution + return Ok(()); + } + + // Regular non-streaming step execution let plugin = self.executor.get_plugin(&step.component).await?; // Clone necessary data for the async task let flow = self.flow.clone(); - let context = self.context.clone(); + let context = self.context.clone() + .with_step(self.flow.steps[step_index].id.clone()); // Create the async task let task_future: BoxFuture<'static, (usize, Result)> = Box::pin(async move { let step = &flow.steps[step_index]; - let result = execute_step_async(plugin, step, step_input, context).await; + let result = execute_step_async(plugin.clone(), step, step_input, context).await; (step_index, result) }); @@ -838,20 +909,12 @@ impl WorkflowExecutor { .await .change_context_lazy(|| ExecutionError::StateError)?; - // Find all streaming steps in the pipeline - let pipeline_steps = self.find_streaming_pipeline_steps(step_index); - - // Create a streaming coordinator and store it - let coordinator = std::sync::Arc::new(tokio::sync::Mutex::new(StreamingPipelineCoordinator::new( - self.executor.clone(), - self.flow.clone(), - pipeline_steps, - self.context.clone(), - ))); - self.streaming_coordinator = Some(coordinator.clone()); - - // Execute the entire pipeline - let pipeline_result = coordinator.lock().await.execute_pipeline().await; + // Reuse the coordinator created in WorkflowExecutor::new + let pipeline_result = if let Some(coord_arc) = &self.streaming_coordinator { + StreamingPipelineCoordinator::run_pipeline_without_lock(coord_arc.clone()).await + } else { + return Err(ExecutionError::Internal.into()); + }; match pipeline_result { Ok(_) => { 
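For readers following the streaming changes in this file, here is a minimal, illustrative sketch (not part of the patch itself) of how a caller might branch on the FlowResult::Streaming variant that the placeholder results above produce. It assumes only the enum fields introduced earlier in this series in flow_result.rs (stream_id, metadata, base64-encoded chunk, chunk_index, is_final) and the tracing/Debug usage already present in this crate; the function and its name are hypothetical.

    use stepflow_core::FlowResult;

    fn log_step_result(step_id: &str, result: &FlowResult) {
        match result {
            FlowResult::Streaming { stream_id, chunk, chunk_index, is_final, .. } => {
                // `chunk` is documented as base64-encoded data; decode it before use.
                tracing::debug!(
                    "step {} stream {} chunk {} (final: {}, {} base64 chars)",
                    step_id, stream_id, chunk_index, is_final, chunk.len()
                );
            }
            FlowResult::Success { result } => tracing::debug!("step {} succeeded: {:?}", step_id, result),
            FlowResult::Skipped => tracing::debug!("step {} skipped", step_id),
            FlowResult::Failed { error } => tracing::warn!("step {} failed: {:?}", step_id, error),
        }
    }
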
@@ -961,33 +1024,86 @@ impl WorkflowExecutor { // Get plugin let plugin = self.executor.get_plugin(&step.component).await?; - // Execute streaming step in a loop - let mut chunk_index = 0; + // For streaming steps, we need to: + // 1. Call the step once to start the generator + // 2. Wait for streaming chunks to come through the notification system + // 3. Process each chunk as it arrives + // 4. Stop when the final chunk arrives - loop { - let result = execute_step_async(plugin.clone(), step, step_input.clone(), self.context.clone()).await?; + tracing::info!("[streaming] Starting streaming step {} with initial call", step_id); + + // Initial call to start the generator + let initial_result = execute_step_async(plugin.clone(), step, step_input.clone(), self.context.clone().with_step(step.id.clone())).await?; - match result { - FlowResult::Streaming { stream_id, metadata, chunk, chunk_index: _, is_final } => { - // Process the streaming chunk - tracing::debug!( - "Streaming step {} chunk {}: stream_id={}, is_final={}", - step_id, chunk_index, stream_id, is_final - ); - - // Here you could emit the chunk to downstream steps or external consumers - // For now, we just log it + match initial_result { + FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { + tracing::info!("[streaming] Step {} started generator, received initial chunk (index={}, is_final={})", step_id, chunk_index, is_final); + + + // Process the initial chunk + let mut chunk_input_data = step_input.as_ref().clone(); + if let serde_json::Value::Object(ref mut map) = chunk_input_data { + map.insert("chunk".to_string(), serde_json::Value::String(chunk.clone())); + map.insert("stream_id".to_string(), serde_json::Value::String(stream_id.clone())); + map.insert("chunk_index".to_string(), serde_json::Value::Number(chunk_index.into())); + map.insert("is_final".to_string(), serde_json::Value::Bool(is_final)); + if let Some(metadata_obj) = metadata.as_ref().as_object() { + for (key, value) in metadata_obj { + map.insert(key.clone(), value.clone()); + } + } + } + let chunk_input = stepflow_core::workflow::ValueRef::new(chunk_input_data); - chunk_index += 1; + let chunk_result = match tokio::time::timeout( + std::time::Duration::from_secs(5), + execute_step_async(plugin.clone(), step, chunk_input, self.context.clone().with_step(step.id.clone())) + ).await { + Ok(result) => result?, + Err(_) => { + tracing::warn!("[streaming] Step {} initial chunk processing timed out", step_id); + // Return a default result for timeout case + FlowResult::Success { + result: stepflow_core::workflow::ValueRef::new(serde_json::json!({ + "error": "timeout", + "message": "Initial chunk processing timed out" + })) + } + } + }; + // If this is the final chunk, we're done if is_final { - break; + tracing::info!("[streaming] Step {} completed with final chunk from initial call", step_id); + } else { + // Wait for additional chunks to come through the streaming notification system + // The chunks will be routed via route_streaming_chunk method + tracing::info!("[streaming] Step {} waiting for additional chunks via streaming notifications", step_id); + + // For now, we'll wait a reasonable amount of time for chunks to arrive + // In a more sophisticated implementation, we'd have a proper notification system + let mut chunk_count = 1; + let max_wait_time = std::time::Duration::from_secs(30); // Wait up to 30 seconds + let start_time = std::time::Instant::now(); + + while start_time.elapsed() < max_wait_time { + // Sleep briefly to allow 
chunks to be processed + tokio::time::sleep(std::time::Duration::from_millis(100)).await; + + // Check if we should continue waiting + // This is a simplified approach - in practice, we'd have proper notification handling + chunk_count += 1; + if chunk_count % 100 == 0 { + tracing::debug!("[streaming] Step {} still waiting for chunks, elapsed: {:?}", step_id, start_time.elapsed()); + } + } + + tracing::info!("[streaming] Step {} finished waiting for chunks, elapsed: {:?}", step_id, start_time.elapsed()); } } FlowResult::Success { result } => { // Non-streaming result, treat as final tracing::debug!("Streaming step {} completed with success", step_id); - break; } FlowResult::Failed { error } => { tracing::error!("Streaming step {} failed: {:?}", step_id, error); @@ -1006,8 +1122,6 @@ impl WorkflowExecutor { } FlowResult::Skipped => { tracing::debug!("Streaming step {} skipped", step_id); - break; - } } } @@ -1029,89 +1143,39 @@ impl WorkflowExecutor { /// Route a streaming chunk to the appropriate streaming pipeline pub async fn route_streaming_chunk(&mut self, chunk: serde_json::Value) -> Result<()> { - tracing::debug!("Routing streaming chunk to workflow executor"); - - // Parse the chunk to extract request_id and chunk data - let chunk_data = match serde_json::from_value::>(chunk.clone()) { - Ok(data) => data, - Err(e) => { - tracing::error!("Failed to parse streaming chunk: {}", e); - return Ok(()); - } - }; + tracing::info!("ROUTE_CHUNK[exec={} addr={:p}] called", self.execution_id(), self as *const _); - // Extract request_id and chunk content - let request_id = chunk_data.get("request_id") - .and_then(|v| v.as_str()) - .unwrap_or("unknown"); - - let chunk_content = chunk_data.get("chunk") - .cloned() - .unwrap_or(serde_json::Value::Null); - - tracing::debug!("Routing chunk for request {}: {:?}", request_id, chunk_content); - - // Find streaming steps that are currently active - let streaming_steps = self.find_active_streaming_steps().await?; - - if streaming_steps.is_empty() { - tracing::warn!("No active streaming steps found for chunk routing"); - return Ok(()); - } - - // Route the chunk to the pipeline coordinator if it exists - if let Some(coordinator) = &self.streaming_coordinator { - let mut coordinator = coordinator.lock().await; - - // Convert the notification chunk to a FlowResult::Streaming - let flow_result = FlowResult::Streaming { - stream_id: request_id.to_string(), - metadata: stepflow_core::workflow::ValueRef::new(serde_json::json!({})), - chunk: chunk_content.to_string(), - chunk_index: 0, // We don't have chunk index from notifications - is_final: false, // We don't know if it's final from notifications - }; - - // Route to all active streaming steps in the pipeline - for &step_index in &streaming_steps { - if let Some(sender) = coordinator.step_connections.get(&step_index) { - if let Err(e) = sender.send(flow_result.clone()).await { - tracing::warn!("Failed to send chunk to step {}: {:?}", step_index, e); - } else { - tracing::debug!("Successfully routed chunk to streaming step {}", step_index); - } - } - } + if let Some(coord_arc) = &self.streaming_coordinator { + // Route chunks directly to the coordinator used by run_pipeline_without_lock + // This ensures chunks are sent to the same channels that the step tasks are listening on + StreamingPipelineCoordinator::route_chunk_to_running_pipeline(coord_arc.clone(), chunk).await?; } else { - tracing::warn!("No streaming coordinator found for chunk routing"); + tracing::warn!("No streaming pipeline active for exec {}", 
self.execution_id()); } - Ok(()) } - /// Find currently active streaming steps - async fn find_active_streaming_steps(&self) -> Result> { + /// Find currently active streaming steps using in-memory workflow information + /// This avoids depending on state store data that might be cleaned up + fn find_active_streaming_steps_in_memory(&self) -> Vec { let mut active_steps = Vec::new(); for (step_index, step) in self.flow.steps.iter().enumerate() { if step.streaming { - // Check if this step is currently running or ready to run - let step_status = self.state_store - .get_step_status(self.execution_id(), step_index) - .await - .map_err(|e| error_stack::report!(ExecutionError::StateError).attach_printable(format!("State error: {e}")))?; - match step_status { - stepflow_core::status::StepStatus::Running | - stepflow_core::status::StepStatus::Runnable => { - active_steps.push(step_index); - } - _ => {} + // For streaming steps, assume they are active if they exist in the coordinator + if let Some(_coord_arc) = &self.streaming_coordinator { + // For now, just assume all streaming steps are active + // We can't easily check step_receivers without async + active_steps.push(step_index); + tracing::debug!("Found active streaming step {} in coordinator", step_index); } } } - Ok(active_steps) + tracing::debug!("Found {} active streaming steps: {:?}", active_steps.len(), active_steps); + active_steps } + } /// Execute a single step asynchronously. @@ -1213,25 +1277,163 @@ struct StreamingPipelineCoordinator { flow: Arc, pipeline_steps: Vec, context: ExecutionContext, - step_connections: std::collections::HashMap>, - step_receivers: std::collections::HashMap>, + resolver: ValueResolver, + step_receivers: std::collections::HashMap>, + step_downstream_senders: std::collections::HashMap>>, + step_senders: std::collections::HashMap>, } impl StreamingPipelineCoordinator { + /// Route chunks to the running pipeline without requiring mutable access to the coordinator + /// This allows chunks to be routed while the receivers are moved out for step tasks + pub async fn route_chunk_to_running_pipeline( + coord_arc: Arc>, + chunk_json: serde_json::Value, + ) -> Result<()> { + let map = serde_json::from_value::>(chunk_json) + .map_err(|e| ExecutionError::MalformedReference { message: e.to_string() })?; + + let coord = coord_arc.lock().await; + + // Extract the step ID this chunk belongs to (default to first pipeline step) + let step_id = map.get("step_id") + .and_then(|v| v.as_str()) + .map(|s| s.to_string()) + .unwrap_or_else(|| { + // Default to first step (source step) if no step_id provided + let first_step_idx = coord.pipeline_steps[0]; + let first_step_id = coord.flow.steps[first_step_idx].id.clone(); + tracing::info!("No step_id in chunk, defaulting to first pipeline step: {}", first_step_id); + first_step_id + }); + + let stream_id = map.get("stream_id") .and_then(|v| v.as_str()).unwrap_or_default().to_string(); + let chunk_index = map.get("chunk_index").and_then(|v| v.as_u64()).unwrap_or(0) as usize; + let is_final = map.get("is_final") .and_then(|v| v.as_bool()).unwrap_or(false); + + // Build the FlowResult + let fr = FlowResult::Streaming { + stream_id: stream_id.clone(), + metadata: stepflow_core::workflow::ValueRef::new(serde_json::Value::Object(map.clone())), + chunk: map.get("chunk").and_then(|v|v.as_str()).unwrap_or("").to_string(), + chunk_index, + is_final, + }; + + // Send to the step's channel (only if the sender still exists) + if let Some(tx) = coord.step_senders.get(&step_id) { + 
tracing::info!("Found sender for step {}, attempting to send chunk {}", step_id, chunk_index); + tracing::info!("HANDLE_CHUNK step={} idx={} final={}", step_id, chunk_index, is_final); + tracing::debug!("send -> {} (buffer={})", step_id, tx.capacity()); + match tx.send(fr.clone()).await { + Ok(_) => { + tracing::info!("Successfully routed chunk {} to step {} (pipeline steps: {:?})", chunk_index, step_id, coord.pipeline_steps); + } + Err(e) => { + tracing::error!("Failed to route chunk {} to step {}: {:?}", chunk_index, step_id, e); + return Err(ExecutionError::StepFailed { step: step_id.clone() }.into()); + } + } + } else { + tracing::warn!("No channel for step {} (available steps: {:?})", step_id, coord.step_senders.keys().collect::>()); + } + + Ok(()) + } + + /// Called by `WorkflowExecutor::route_streaming_chunk` to inject + /// *all* the chunks, not just the first. + pub async fn handle_chunk(&mut self, chunk_json: serde_json::Value) -> Result<()> { + let map = serde_json::from_value::>(chunk_json) + .map_err(|e| ExecutionError::MalformedReference { message: e.to_string() })?; + + // Extract the step ID this chunk belongs to (default to first pipeline step) + let step_id = map.get("step_id") + .and_then(|v| v.as_str()) + .map(|s| s.to_string()) + .unwrap_or_else(|| { + // Default to first step (source step) if no step_id provided + // This handles chunks coming from Python components that don't include step_id + let first_step_idx = self.pipeline_steps[0]; + let first_step_id = self.flow.steps[first_step_idx].id.clone(); + tracing::info!("No step_id in chunk, defaulting to first pipeline step: {}", first_step_id); + first_step_id + }); + + let stream_id = map.get("stream_id") .and_then(|v| v.as_str()).unwrap_or_default().to_string(); + let chunk_index = map.get("chunk_index").and_then(|v| v.as_u64()).unwrap_or(0) as usize; + let is_final = map.get("is_final") .and_then(|v| v.as_bool()).unwrap_or(false); + + // Build the FlowResult + let fr = FlowResult::Streaming { + stream_id: stream_id.clone(), + metadata: stepflow_core::workflow::ValueRef::new(serde_json::Value::Object(map.clone())), + chunk: map.get("chunk").and_then(|v|v.as_str()).unwrap_or("").to_string(), + chunk_index, + is_final, + }; + + // Only deliver to the step itself - let the step handle forwarding downstream + if let Some(tx) = self.step_senders.get(&step_id) { + tracing::info!("Found sender for step {}, attempting to send chunk {}", step_id, chunk_index); + match tx.send(fr.clone()).await { + Ok(_) => { + tracing::info!("Successfully routed chunk {} to step {} (pipeline steps: {:?})", chunk_index, step_id, self.pipeline_steps); + } + Err(e) => { + tracing::error!("Failed to route chunk {} to step {}: {:?}", chunk_index, step_id, e); + return Err(ExecutionError::StepFailed { step: step_id.clone() }.into()); + } + } + } else { + tracing::warn!("No channel for step {} (available steps: {:?})", step_id, self.step_senders.keys().collect::>()); + } + + Ok(()) + } + fn new( executor: Arc, flow: Arc, pipeline_steps: Vec, context: ExecutionContext, + resolver: ValueResolver, ) -> Self { - let mut step_connections = std::collections::HashMap::new(); let mut step_receivers = std::collections::HashMap::new(); + let mut step_downstream_senders = std::collections::HashMap::new(); + let mut step_senders = std::collections::HashMap::new(); + + tracing::info!("[DEBUG-CHANNEL-SETUP] Creating channels for pipeline steps: {:?}", pipeline_steps); - // Create channels for each step + // Create input receivers for each step for &step_index 
in &pipeline_steps { - let (tx, rx) = tokio::sync::mpsc::channel(100); // Buffer 100 chunks - step_connections.insert(step_index, tx); - step_receivers.insert(step_index, rx); + let step_id = flow.steps[step_index].id.clone(); + let (input_tx, input_rx) = tokio::sync::mpsc::channel(100); + let sender_clone = input_tx.clone(); + step_senders.insert(step_id.clone(), sender_clone); + step_receivers.insert(step_id.clone(), input_rx); + tracing::info!("[DEBUG-CHANNEL] Created channel for step {} (index {}) - receiver capacity: {}", + step_id, step_index, 100); + } + + // Set up the pipeline connections + tracing::info!("[DEBUG-CHANNEL-SETUP] Setting up pipeline connections for {} steps", pipeline_steps.len()); + for i in 0..pipeline_steps.len() { + let step_index = pipeline_steps[i]; + let step_id = flow.steps[step_index].id.clone(); + tracing::info!("[DEBUG-CHANNEL-SETUP] Processing step {} ({}) at position {}", step_id, step_index, i); + + // Set up downstream senders for this step + let mut downstream_senders = Vec::new(); + if i < pipeline_steps.len() - 1 { + // This step sends to the next step's input + let next_step_index = pipeline_steps[i + 1]; + let next_step_id = flow.steps[next_step_index].id.clone(); + if let Some(next_step_sender) = step_senders.get(&next_step_id).cloned() { + downstream_senders.push(next_step_sender); + } + } + step_downstream_senders.insert(step_id, downstream_senders); } Self { @@ -1239,223 +1441,436 @@ impl StreamingPipelineCoordinator { flow, pipeline_steps, context, - step_connections, + resolver, step_receivers, + step_downstream_senders, + step_senders, } } - async fn execute_pipeline(&mut self) -> Result<()> { - tracing::info!("Executing streaming pipeline with {} steps", self.pipeline_steps.len()); - - // Create tasks for each streaming step - let mut tasks = Vec::new(); - let flow_arc = self.flow.clone(); + + + + + /// Run the pipeline without holding the mutex lock + /// This allows route_streaming_chunk to acquire the lock while the pipeline is running + async fn run_pipeline_without_lock(coord_arc: Arc>) -> Result<()> { + tracing::info!("[DEBUG-PIPELINE] Starting pipeline execution without lock"); - for &step_index in &self.pipeline_steps { - let flow_arc = flow_arc.clone(); - let step_input = self.resolve_step_input(step_index).await?; - let downstream_senders = self.get_downstream_senders(step_index); + // Resolve step inputs and spawn tasks while holding the lock to avoid race conditions + let mut handles = Vec::new(); + { + let mut guard = coord_arc.lock().await; + let pipeline_steps = guard.pipeline_steps.clone(); + let executor = guard.executor.clone(); + let flow = guard.flow.clone(); + let context = guard.context.clone(); + + // Resolve step inputs first + let mut step_inputs = std::collections::HashMap::new(); + for &step_idx in &pipeline_steps { + let input = guard.resolve_step_input(step_idx).await?; + step_inputs.insert(step_idx, input); + } - if let Some(receiver) = self.step_receivers.remove(&step_index) { - let executor = self.executor.clone(); - let context = self.context.clone(); - let task = tokio::spawn(async move { - let step = &flow_arc.steps[step_index]; - Self::run_streaming_step( - executor, - step, - step_input, - context, - receiver, - downstream_senders, - ).await + // Now spawn all tasks while still holding the lock to prevent race conditions + for &step_idx in &pipeline_steps { + let step_id = flow.steps[step_idx].id.clone(); + + // Take sender & receiver out now, before spawning + let rx = 
guard.step_receivers.remove(&step_id).ok_or_else(|| { + ExecutionError::Internal + })?; + let _sender = guard.step_senders.get(&step_id).unwrap().clone(); // Keep sender in map for handle_chunk + let downstream = guard.step_downstream_senders + .get(&step_id).cloned().unwrap_or_default(); + let input = step_inputs.remove(&step_idx).ok_or_else(|| { + ExecutionError::Internal + })?; + + tracing::info!("Starting step task for {} with receiver while holding lock", step_id); + let plugin = executor.get_plugin(&flow.steps[step_idx].component).await?; + let context = context.clone() + .with_step(step_id.clone()); + let step = flow.steps[step_idx].clone(); + let is_source = step_idx == pipeline_steps[0]; + + // Spawn while still holding the pieces and the lock + let h = tokio::spawn(async move { + tracing::info!("Step task {} about to call run_streaming_step_simple", step_id); + let result = run_streaming_step_simple(plugin, step, input, context, rx, downstream, is_source).await; + tracing::info!("Step task {} finished run_streaming_step_simple: {:?}", step_id, result.is_ok()); + result }); - tasks.push(task); + handles.push((step_idx, h)); } + } // Lock dropped NOW - after all tasks are spawned with their receivers + + // Capture flow and pipeline_steps outside of the lock for later use + let (flow, pipeline_steps) = { + let guard = coord_arc.lock().await; + (guard.flow.clone(), guard.pipeline_steps.clone()) + }; + + // Give all tasks a moment to start + tracing::info!("[DEBUG-PIPELINE] Giving tasks 500ms to start up"); + tokio::time::sleep(std::time::Duration::from_millis(500)).await; + + // Now trigger the source component to start generating chunks + if let Some(source_step_idx) = pipeline_steps.first() { + let source_step_id = flow.steps[*source_step_idx].id.clone(); + tracing::info!("[DEBUG-PIPELINE] Triggering source component {} to start generating", source_step_id); + + // Get the step input for the source step + let source_input = { + let guard = coord_arc.lock().await; + guard.resolve_step_input(*source_step_idx).await? + }; + + // Get the plugin for the source step + let source_plugin = { + let guard = coord_arc.lock().await; + guard.executor.get_plugin(&flow.steps[*source_step_idx].component).await? 
+ }; + + // Create execution context for the source step + let source_context = { + let guard = coord_arc.lock().await; + guard.context.clone().with_step(source_step_id.clone()) + }; + + // Trigger the source component in a separate task (fire and forget) + let source_step = flow.steps[*source_step_idx].clone(); + tokio::spawn(async move { + tracing::info!("[DEBUG-GENERATOR] Starting source generator for {}", source_step_id); + match execute_step_async(source_plugin, &source_step, source_input, source_context).await { + Ok(result) => { + tracing::info!("[DEBUG-GENERATOR] Source generator {} completed: {:?}", source_step_id, result); + } + Err(e) => { + tracing::error!("[DEBUG-GENERATOR] Source generator {} failed: {:?}", source_step_id, e); + } + } + }); } - // Wait for all streaming steps to complete - // Since streaming steps don't wait for input chunks anymore, they should complete quickly - for task in tasks { - task.await.map_err(|_e| ExecutionError::StepFailed { - step: "streaming_pipeline".to_string() - })??; + // Wait for all step handles to complete + tracing::info!("[DEBUG-PIPELINE] Waiting for all {} step handles to complete", handles.len()); + for (step_idx, handle) in handles { + let step_id = &flow.steps[step_idx].id; + tracing::info!("[DEBUG-PIPELINE] Waiting for step {} to complete", step_id); + match handle.await { + Ok(result) => { + if let Err(e) = result { + tracing::warn!("Step {} completed with error: {:?}", step_id, e); + return Err(e); + } else { + tracing::info!("Step {} completed successfully", step_id); + } + } + Err(e) => { + tracing::warn!("Step {} task panicked: {:?}", step_id, e); + return Err(ExecutionError::Internal.into()); + } + } } + tracing::info!("[DEBUG-PIPELINE] run_pipeline_without_lock completed successfully"); Ok(()) } - + async fn resolve_step_input(&self, step_index: usize) -> Result { - // Create a basic input for streaming steps - // In a full implementation, this would resolve dependencies from previous steps + // For streaming steps, we need simpler input resolution + // since they don't depend on other steps' outputs let step = &self.flow.steps[step_index]; - // For streaming steps, we typically need some basic configuration - let input = serde_json::json!({ - "step_id": step.id, - "step_index": step_index, - "streaming": true, - "component": step.component.to_string() - }); - - Ok(stepflow_core::workflow::ValueRef::new(input)) - } - - fn get_downstream_senders(&self, step_index: usize) -> Vec> { - let mut senders = Vec::new(); - - // Find steps that come after this step in the pipeline - for &other_step_index in &self.pipeline_steps { - if other_step_index > step_index { - if let Some(sender) = self.step_connections.get(&other_step_index) { - senders.push(sender.clone()); - } + // For streaming steps, resolve the input directly without dependencies + // This avoids the "undefined value" error for streaming pipelines + if step.streaming { + // For streaming steps, try to resolve the input expression directly + // If it fails, fall back to the workflow input + match self.resolver.resolve(&step.input).await { + Ok(FlowResult::Success { result }) => Ok(result), + Ok(FlowResult::Streaming { metadata, .. 
}) => Ok(metadata), + _ => { + // Fall back to workflow input for streaming steps + tracing::info!("[DEBUG-RESOLVE] Falling back to workflow input for streaming step {}", step.id); + Ok(self.resolver.workflow_input().clone()) + } } - } - - senders - } - - async fn route_chunk_to_step(&mut self, step_index: usize, chunk: serde_json::Value) -> Result<()> { - if let Some(sender) = self.step_connections.get(&step_index) { - let flow_result = FlowResult::Streaming { - stream_id: "routed_chunk".to_string(), - metadata: stepflow_core::workflow::ValueRef::new(serde_json::json!({})), - chunk: chunk.to_string(), - chunk_index: 0, - is_final: false, - }; - - sender.send(flow_result).await - .map_err(|e| ExecutionError::StepFailed { - step: format!("step_{}", step_index) - })?; - - tracing::debug!("Successfully routed chunk to step {}", step_index); } else { - tracing::warn!("No sender found for step {}", step_index); + // For non-streaming steps, use the full resolver + let step_input = match self.resolver.resolve(&step.input).await? { + FlowResult::Success { result } => result, + FlowResult::Streaming { metadata, .. } => metadata, + FlowResult::Skipped => { + return Err(ExecutionError::StepNotRunnable { + step: step.id.clone(), + } + .into()); + } + FlowResult::Failed { error } => { + return Err(ExecutionError::StepFailed { step: step.id.clone() }.into()); + } + }; + Ok(step_input) } - - Ok(()) } - async fn run_streaming_step( - executor: Arc, - step: &stepflow_core::workflow::Step, - step_input: stepflow_core::workflow::ValueRef, - context: ExecutionContext, - mut receiver: tokio::sync::mpsc::Receiver, - downstream_senders: Vec>, - ) -> Result<()> { - let step_id = step.id.clone(); - let plugin = executor.get_plugin(&step.component).await?; - tracing::info!("Starting streaming step: {}", step_id); - - // Execute the step to get initial result with a timeout - let timeout_duration = std::time::Duration::from_secs(10); - let result = match tokio::time::timeout(timeout_duration, execute_step_async(plugin.clone(), step, step_input.clone(), context.clone())).await { - Ok(result) => result?, - Err(_) => { - tracing::error!("Streaming step {} timed out after {} seconds", step_id, timeout_duration.as_secs()); - return Err(ExecutionError::StepFailed { step: step_id }.into()); - } - }; +} - match result { - FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { - // Send the chunk to downstream steps - for sender in &downstream_senders { - let _ = sender.send(FlowResult::Streaming { - stream_id: stream_id.clone(), - metadata: metadata.clone(), - chunk: chunk.clone(), - chunk_index, - is_final, - }).await; - } +/// A per-step streaming loop: receive chunks, call your component, forward every chunk downstream, +/// exit only when `is_final == true`. 
+async fn run_streaming_step_simple( + plugin: Arc>, + step: stepflow_core::workflow::Step, + input: stepflow_core::workflow::ValueRef, + context: ExecutionContext, + mut rx: mpsc::Receiver, + downstream: Vec>, + is_source: bool, +) -> Result<()> { + let step_id = step.id.clone(); + stream_log!(info, &step_id, "starting (is_source={}, downstream={})", is_source, downstream.len()); + + // For source steps, we now rely on the notification system to start the generator + // The generator will be triggered when the first chunk request comes in + if is_source { + stream_log!(info, &step_id, "source step entering receiver loop, generator will start via notifications"); + } else { + stream_log!(info, &step_id, "sink/middle step entering receiver loop"); + } - tracing::info!("Streaming step {} processed initial chunk, waiting for additional chunks", step_id); + // Now loop for all chunks coming through the coordinator's routing system + let mut last_stream_id = String::new(); + let mut last_metadata = stepflow_core::workflow::ValueRef::new(serde_json::Value::Null); + let mut last_chunk = String::new(); + let mut last_chunk_index = 0; + let mut last_is_final = false; + + loop { + tracing::info!("[STREAM] Step {} waiting for chunk via receiver", step_id); + let recv_result = rx.recv().await; + tracing::info!("[STREAM] Step {} received result from rx.recv(): {:?}", step_id, recv_result.is_some()); + match recv_result { + Some(FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final }) => { + stream_log!(info, &step_id, "RECEIVED chunk #{} from receiver", chunk_index); + tracing::info!("RX step={} idx={} final={} (source={})", step_id, chunk_index, is_final, is_source); + stream_log!(info, &step_id, "processing chunk #{}", chunk_index); - // Now wait for additional chunks to come through the channel - // These chunks are routed from the notification system - let mut chunk_count = 1; - let max_chunks = 1000; // Safety limit + // Store the streaming metadata for potential use in non-streaming case + last_stream_id = stream_id.clone(); + last_metadata = metadata.clone(); + last_chunk = chunk.clone(); + last_chunk_index = chunk_index; + last_is_final = is_final; - while chunk_count < max_chunks { - // Wait for chunks with a timeout - match tokio::time::timeout(std::time::Duration::from_secs(5), receiver.recv()).await { - Ok(Some(FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final })) => { - chunk_count += 1; - tracing::debug!("Streaming step {} received chunk {}: stream_id={}, is_final={}", - step_id, chunk_count, stream_id, is_final); - - // Process the chunk by calling the step again - let chunk_input = stepflow_core::workflow::ValueRef::new(serde_json::json!({ - "chunk": chunk, - "stream_id": stream_id, - "chunk_index": chunk_index, - "is_final": is_final, - "metadata": metadata.as_ref() - })); - - let chunk_result = match tokio::time::timeout( - std::time::Duration::from_secs(5), - execute_step_async(plugin.clone(), step, chunk_input, context.clone()) - ).await { - Ok(result) => result?, - Err(_) => { - tracing::warn!("Streaming step {} chunk processing timed out", step_id); - continue; - } - }; - - // Send the processed chunk to downstream steps - for sender in &downstream_senders { - let _ = sender.send(chunk_result.clone()).await; - } - - // If this is the final chunk, we're done - if is_final { - tracing::info!("Streaming step {} received final chunk, completing", step_id); - break; - } + // For non-source steps, call the component to process the chunk + let 
(final_stream_id, final_metadata, final_chunk, final_chunk_index, final_is_final) = if !is_source { + // For non-source steps, we need to create a proper input that contains only the actual data + // without any $from references, by extracting the relevant fields from the streaming chunk + let chunk_input_data = serde_json::json!({ + "chunk": chunk, + "stream_id": stream_id, + "chunk_index": chunk_index, + "is_final": is_final, + // Add all the metadata fields from the streaming chunk + "sample_rate": metadata.as_ref().get("sample_rate").unwrap_or(&serde_json::Value::Null), + "channels": metadata.as_ref().get("channels").unwrap_or(&serde_json::Value::Null), + "operation": metadata.as_ref().get("operation").unwrap_or(&serde_json::Value::Null), + "output_file": metadata.as_ref().get("output_file").unwrap_or(&serde_json::Value::Null), + "gain": metadata.as_ref().get("gain").unwrap_or(&serde_json::Value::Null), + }); + let chunk_input = stepflow_core::workflow::ValueRef::new(chunk_input_data); + + // Call the component to process the chunk + let step_context = context.clone().with_step(step.id.clone()); + match execute_step_async(plugin.clone(), &step, chunk_input, step_context).await? { + FlowResult::Streaming { stream_id: processed_stream_id, metadata: processed_metadata, chunk: processed_chunk, chunk_index: processed_chunk_index, is_final: processed_is_final } => { + tracing::info!("[STREAM] Step {} component processed chunk #{}", step_id, processed_chunk_index); + (processed_stream_id, processed_metadata, processed_chunk, processed_chunk_index, processed_is_final) } - Ok(Some(_)) => { - // Received non-streaming result, ignore - continue; + FlowResult::Success { .. } => { + tracing::info!("[STREAM] Step {} component returned success, forwarding original chunk", step_id); + // For success results, forward the original chunk + (stream_id, metadata, chunk, chunk_index, is_final) } - Ok(None) => { - // Channel closed, we're done - tracing::info!("Streaming step {} channel closed, completing", step_id); - break; + other => { + tracing::warn!("[STREAM] Step {} component returned unexpected result: {:?}", step_id, other); + (stream_id, metadata, chunk, chunk_index, is_final) } - Err(_) => { - // Timeout - no more chunks for now - tracing::debug!("Streaming step {} no more chunks after timeout", step_id); - break; + } + } else { + // Source step just forwards the chunk as-is + (stream_id, metadata, chunk, chunk_index, is_final) + }; + + // Forward to downstream steps + stream_log!(info, &step_id, "forwarding chunk #{} to {} downstream", final_chunk_index, downstream.len()); + for (i, tx) in downstream.iter().enumerate() { + match tx.send(FlowResult::Streaming { + stream_id: final_stream_id.clone(), + metadata: final_metadata.clone(), + chunk: final_chunk.clone(), + chunk_index: final_chunk_index, + is_final: final_is_final, + }).await { + Ok(_) => { + stream_log!(info, &step_id, "successfully forwarded chunk #{} to downstream {}", final_chunk_index, i); + } + Err(e) => { + stream_log!(warn, &step_id, "failed to forward chunk #{} to downstream {}: {:?}", final_chunk_index, i, e); } } } - - if chunk_count >= max_chunks { - tracing::warn!("Streaming step {} reached maximum chunk limit ({})", step_id, max_chunks); + + // Stop the *source* task once it sees its own final packet. + // Every other task keeps listening until its inbound channel is closed. 
+ if is_source && final_is_final { + stream_log!(info, &step_id, "saw final chunk, exiting"); + break; } } - FlowResult::Success { result } => { - tracing::info!("Streaming step {} completed with success", step_id); - } - FlowResult::Failed { error } => { - tracing::error!("Streaming step {} failed: {:?}", step_id, error); - return Err(ExecutionError::StepFailed { step: step_id }.into()); + Some(other) => { + stream_log!(warn, &step_id, "received non-streaming result: {:?}", other); + // Extract actual data from the non-streaming result and forward it as streaming + match other { + FlowResult::Success { result } => { + // Convert the success result to a streaming chunk + for tx in &downstream { + let _ = tx.send(FlowResult::Streaming { + stream_id: last_stream_id.clone(), + metadata: result.clone(), + chunk: serde_json::to_string(result.as_ref()).unwrap_or_default(), + chunk_index: last_chunk_index, + is_final: last_is_final, + }).await; + } + } + _ => { + // For other result types, use last known metadata + for tx in &downstream { + let _ = tx.send(FlowResult::Streaming { + stream_id: last_stream_id.clone(), + metadata: last_metadata.clone(), + chunk: last_chunk.clone(), + chunk_index: last_chunk_index, + is_final: last_is_final, + }).await; + } + } + } + // Only exit if this was truly the final chunk + if last_is_final { + stream_log!(info, &step_id, "received final packet in non-streaming arm, exiting"); + break; + } + // Otherwise keep looping to process more chunks } - FlowResult::Skipped => { - tracing::info!("Streaming step {} skipped", step_id); + None => { + stream_log!(info, &step_id, "channel closed"); + break; } } + } + + stream_log!(info, &step_id, "completed"); + Ok(()) +} - Ok(()) +/// Sort streaming steps by their dependencies using a topological sort +/// This ensures that source steps come before steps that depend on them +fn sort_streaming_steps_by_dependencies( + flow: &Flow, + streaming_steps: Vec, +) -> Result> { + use std::collections::{HashMap, HashSet, VecDeque}; + + // Create a map of step ID to index for quick lookup + let step_id_to_index: HashMap = streaming_steps + .iter() + .map(|&idx| (flow.steps[idx].id.clone(), idx)) + .collect(); + + // Build dependency graph for streaming steps only + let mut dependencies: HashMap> = HashMap::new(); + let mut dependents: HashMap> = HashMap::new(); + + for &step_idx in &streaming_steps { + dependencies.insert(step_idx, HashSet::new()); + dependents.insert(step_idx, HashSet::new()); } + + // Analyze dependencies between streaming steps + for &step_idx in &streaming_steps { + let step = &flow.steps[step_idx]; + + // Check if this step's input references other streaming steps + let input_str = serde_json::to_string(&step.input).unwrap_or_default(); + + for &other_step_idx in &streaming_steps { + if step_idx != other_step_idx { + let other_step_id = &flow.steps[other_step_idx].id; + + // Check if step references other_step in its input + if input_str.contains(&format!("step: {}", other_step_id)) || + input_str.contains(&format!("\"step\": \"{}\"", other_step_id)) { + // step_idx depends on other_step_idx + dependencies.get_mut(&step_idx).unwrap().insert(other_step_idx); + dependents.get_mut(&other_step_idx).unwrap().insert(step_idx); + + tracing::info!("Detected dependency: {} depends on {}", + step.id, other_step_id); + } + } + } + } + + // Topological sort using Kahn's algorithm + let mut result = Vec::new(); + let mut queue = VecDeque::new(); + let mut remaining_deps = dependencies.clone(); + + // Find steps with no 
dependencies (source steps)
+    for &step_idx in &streaming_steps {
+        if remaining_deps[&step_idx].is_empty() {
+            queue.push_back(step_idx);
+            tracing::info!("Found source streaming step: {}", flow.steps[step_idx].id);
+        }
+    }
+
+    while let Some(current_step) = queue.pop_front() {
+        result.push(current_step);
+
+        // Remove this step from its dependents' dependency lists
+        for &dependent_step in &dependents[&current_step] {
+            remaining_deps.get_mut(&dependent_step).unwrap().remove(&current_step);
+
+            // If the dependent now has no dependencies, add it to the queue
+            if remaining_deps[&dependent_step].is_empty() {
+                queue.push_back(dependent_step);
+            }
+        }
+    }
+
+    // Check for circular dependencies
+    if result.len() != streaming_steps.len() {
+        let remaining: Vec<String> = streaming_steps
+            .iter()
+            .filter(|&&idx| !result.contains(&idx))
+            .map(|&idx| flow.steps[idx].id.clone())
+            .collect();
+
+        tracing::error!("Circular dependency detected in streaming steps: {:?}", remaining);
+        return Err(ExecutionError::Internal.into());
+    }
+
+    tracing::info!("Topological sort result: {:?}",
+        result.iter().map(|i| &flow.steps[*i].id).collect::<Vec<_>>()
+    );
+
+    Ok(result)
+}
 
 #[cfg(test)]
@@ -1789,8 +2204,6 @@ steps:
     component: mock://parallel1
     input:
       $from:
-        workflow: input
-
-  - id: step2
     component: mock://parallel2
     input:
       $from:
@@ -1825,7 +2238,6 @@ output:
             (
                 "mock://parallel2",
                 FlowResult::Success {
-                    result: ValueRef::new(step2_output.clone()),
                 },
             ),
             (
@@ -2120,3 +2532,9 @@ output:
         }
     }
 }
+
+
+
+
+
+
diff --git a/crates/stepflow-plugin/src/context.rs b/crates/stepflow-plugin/src/context.rs
index 4e55b56d..1c0e5ebc 100644
--- a/crates/stepflow-plugin/src/context.rs
+++ b/crates/stepflow-plugin/src/context.rs
@@ -61,6 +61,8 @@ pub trait Executor: Send + Sync {
 pub struct ExecutionContext {
     context: Arc,
     execution_id: Uuid,
+    /// Optional step ID for streaming pipelines
+    step_id: Option<String>,
 }
 
 impl ExecutionContext {
@@ -69,14 +71,26 @@ impl ExecutionContext {
         Self {
             context,
             execution_id,
+            step_id: None,
         }
     }
 
+    /// Add step ID to this context (builder pattern)
+    pub fn with_step(mut self, step_id: String) -> Self {
+        self.step_id = Some(step_id);
+        self
+    }
+
     /// Get the execution ID for this context.
     pub fn execution_id(&self) -> Uuid {
         self.execution_id
     }
 
+    /// Get the step ID for this context (if set).
+    pub fn step_id(&self) -> Option<&str> {
+        self.step_id.as_deref()
+    }
+
     /// Get a reference to the state store.
pub fn state_store(&self) -> &Arc { self.context.state_store() diff --git a/crates/stepflow-protocol/Cargo.toml b/crates/stepflow-protocol/Cargo.toml index 08a76542..59c9e95f 100644 --- a/crates/stepflow-protocol/Cargo.toml +++ b/crates/stepflow-protocol/Cargo.toml @@ -18,6 +18,7 @@ indexmap.workspace = true serde_json.workspace = true serde.workspace = true stepflow-core.workspace = true +stepflow-execution.workspace = true stepflow-plugin.workspace = true thiserror.workspace = true tokio.workspace = true diff --git a/crates/stepflow-protocol/src/blob_handlers.rs b/crates/stepflow-protocol/src/blob_handlers.rs index 96ed90f6..fa259a9f 100644 --- a/crates/stepflow-protocol/src/blob_handlers.rs +++ b/crates/stepflow-protocol/src/blob_handlers.rs @@ -1,8 +1,10 @@ +use std::fmt; use error_stack::ResultExt as _; use futures::future::{BoxFuture, FutureExt as _}; use serde::{Deserialize, Serialize}; use serde_json::value::RawValue; use std::sync::Arc; +use stepflow_execution::WorkflowExecutor; use stepflow_plugin::Context; use tokio::sync::mpsc; use uuid::Uuid; @@ -175,23 +177,63 @@ impl IncomingHandler for StreamingChunkHandler { async move { // This is a notification (no ID), so we don't send a response // Instead, we need to handle the streaming chunk - match serde_json::from_str::(params.get()) { + match serde_json::from_str::(params.get()) { Ok(notification) => { - tracing::info!("Received streaming chunk for request {}: {:?}", - notification.request_id, notification.chunk); + tracing::info!("Received streaming chunk for request {}: step_id={:?}, chunk_index={}", + notification.request_id, notification.step_id, notification.chunk_index); // Route this chunk to the appropriate workflow executor if let Some(executor) = context.executor() { + tracing::debug!("Executor available, attempting to parse execution ID: {}", notification.request_id); + if let Ok(execution_id) = Uuid::parse_str(¬ification.request_id) { + tracing::info!("Successfully parsed execution ID: {}", execution_id); + tracing::info!("Looking up workflow executor for execution ID: {}", execution_id); + // Try to find the workflow executor for this execution - if let Ok(Some(mut workflow_executor)) = executor.get_workflow_executor(execution_id).await { - // For now, just log that we received the chunk - // TODO: Implement proper chunk routing when the streaming pipeline is ready - tracing::info!("Received streaming chunk for execution {}: {:?}", - execution_id, notification.chunk); - tracing::warn!("Streaming chunk routing not yet implemented for trait objects"); - } else { + match executor.get_workflow_executor(execution_id).await { + Ok(Some(workflow_executor_any)) => { + tracing::info!("Found workflow executor for execution ID: {}", execution_id); + + // Downcast to the concrete WorkflowExecutor type + match workflow_executor_any.downcast::>>() { + Ok(workflow_executor_arc) => { + tracing::debug!("Successfully downcast to Arc>, routing chunk"); + + // Lock the mutex to access the workflow executor + let mut workflow_executor = workflow_executor_arc.lock().await; + + // Route the chunk to the workflow executor with full metadata + let chunk_with_metadata = serde_json::json!({ + "request_id": notification.request_id, + "stream_id": notification.stream_id, + "chunk_index": notification.chunk_index, + "is_final": notification.is_final, + "step_id": notification.step_id, + "chunk": notification.chunk + }); + tracing::info!("Sending chunk to workflow executor with step_id={:?}", notification.step_id); + match 
workflow_executor.route_streaming_chunk(chunk_with_metadata).await { + Ok(_) => { + tracing::debug!("Successfully routed streaming chunk to workflow executor"); + } + Err(e) => { + tracing::error!("Failed to route streaming chunk to workflow executor: {:?}", e); + } + } + } + Err(_) => { + tracing::warn!("Failed to downcast workflow executor to Arc> type for execution ID: {}", execution_id); + } + } + } + Ok(None) => { tracing::warn!("No workflow executor found for execution ID: {}", execution_id); + tracing::error!("Failed to route streaming chunk to workflow executor: no executor found for execution ID {}", execution_id); + } + Err(e) => { + tracing::error!("Error getting workflow executor for execution ID {}: {:?}", execution_id, e); + } } } else { tracing::warn!("Invalid execution ID in streaming chunk: {}", notification.request_id); @@ -212,8 +254,22 @@ impl IncomingHandler for StreamingChunkHandler { } } -#[derive(Debug, Deserialize)] +#[derive(Deserialize)] struct StreamingChunkNotification { request_id: String, + stream_id: String, + chunk_index: u64, + is_final: bool, + step_id: Option, chunk: serde_json::Value, } + +impl fmt::Debug for StreamingChunkNotification { + fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { + f.debug_struct("StreamingChunkNotification") + .field("request_id", &self.request_id) + // just show that it exists, not its contents + .field("chunk", &"") + .finish() + } +} diff --git a/crates/stepflow-protocol/src/incoming_handler.rs b/crates/stepflow-protocol/src/incoming_handler.rs index f61fdddc..d41b0af5 100644 --- a/crates/stepflow-protocol/src/incoming_handler.rs +++ b/crates/stepflow-protocol/src/incoming_handler.rs @@ -77,7 +77,9 @@ impl IncomingHandlerRegistry { response_tx: mpsc::Sender, context: Arc, ) { + tracing::debug!("Looking for handler for method: {}", method); if let Some(handler) = self.handlers.get(&method) { + tracing::debug!("Found handler for method: {}", method); // Now we can spawn the handler with owned values let future = handler.handle_incoming(method.clone(), params, id, response_tx.clone(), context); @@ -87,6 +89,7 @@ impl IncomingHandlerRegistry { } }); } else { + tracing::debug!("No handler found for method: {}", method); // Send error response for unknown method if it's a method call (has ID) if let Some(id) = id { tracing::error!("Unknown method: {}", method); diff --git a/crates/stepflow-protocol/src/schema/component_execute.rs b/crates/stepflow-protocol/src/schema/component_execute.rs index b4c2e609..c90b8690 100644 --- a/crates/stepflow-protocol/src/schema/component_execute.rs +++ b/crates/stepflow-protocol/src/schema/component_execute.rs @@ -1,5 +1,6 @@ use serde::{Deserialize, Serialize}; use stepflow_core::workflow::{Component, ValueRef}; +use uuid::Uuid; use crate::schema::Method; @@ -8,6 +9,8 @@ use crate::schema::Method; pub struct Request { pub component: Component, pub input: ValueRef, + pub execution_id: Uuid, + pub step_id: String, } /// Response to the initialization request. 
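A minimal sketch of what these protocol changes imply on the wire: the extended component_execute::Request now carries execution_id and step_id, and the StreamingChunkHandler above deserializes chunk notifications whose params hold request_id, stream_id, chunk_index, is_final, an optional step_id, and the chunk payload. Only that field shape is taken from the patch; the method name "streaming_chunk" and the example values below are assumptions for illustration.

    // Sketch of a chunk-notification payload matching StreamingChunkNotification.
    // The method name and values are placeholders; the param names mirror the patch.
    use serde_json::json;
    use uuid::Uuid;

    fn example_chunk_notification(execution_id: Uuid) -> serde_json::Value {
        json!({
            "jsonrpc": "2.0",
            "method": "streaming_chunk",                // assumed method name
            "params": {
                "request_id": execution_id.to_string(), // parsed back into the execution Uuid
                "stream_id": "stream-1",
                "chunk_index": 0,
                "is_final": false,
                "step_id": "audio_source",              // optional; handle_chunk falls back to the first pipeline step
                "chunk": "<base64-encoded PCM bytes>"
            }
        })
    }

On the Rust side these params round-trip into StreamingChunkNotification and then into FlowResult::Streaming via route_streaming_chunk/handle_chunk.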
diff --git a/crates/stepflow-protocol/src/stdio/client.rs b/crates/stepflow-protocol/src/stdio/client.rs index 7448a22e..63c7a994 100644 --- a/crates/stepflow-protocol/src/stdio/client.rs +++ b/crates/stepflow-protocol/src/stdio/client.rs @@ -33,6 +33,7 @@ impl Client { let (outgoing_tx, outgoing_rx) = mpsc::channel(100); let (pending_tx, pending_rx) = mpsc::channel(100); + //let recv_span = tracing::info_span!("recv_message_loop", command = ?launcher.command, args = ?launcher.args); let recv_span = tracing::info_span!("recv_message_loop", command = ?launcher.command, args = ?launcher.args); let loop_handle = tokio::spawn( recv_message_loop( diff --git a/crates/stepflow-protocol/src/stdio/plugin.rs b/crates/stepflow-protocol/src/stdio/plugin.rs index 4cfa1e9b..d4fd3f2a 100644 --- a/crates/stepflow-protocol/src/stdio/plugin.rs +++ b/crates/stepflow-protocol/src/stdio/plugin.rs @@ -140,7 +140,7 @@ impl Plugin for StdioPlugin { async fn execute( &self, component: &Component, - _context: ExecutionContext, + context: ExecutionContext, input: ValueRef, ) -> Result { let client_handle = self.client_handle().await?; @@ -148,10 +148,107 @@ impl Plugin for StdioPlugin { .request(&crate::schema::component_execute::Request { component: component.clone(), input, + execution_id: context.execution_id(), + step_id: context.step_id().unwrap_or("unknown").to_string(), }) .await .change_context(PluginError::Execution)?; + tracing::debug!("StdioPlugin: Received response: {:?}", response.output); + + // Check if the response contains a FlowResult by looking for the "outcome" field + if let Some(outcome_obj) = response.output.as_object() { + if let Some(outcome_value) = outcome_obj.get("outcome") { + if let Some(outcome_str) = outcome_value.as_str() { + tracing::debug!("StdioPlugin: Found outcome field with value: {}", outcome_str); + // If the response has an "outcome" field, try to deserialize it as a FlowResult + match outcome_str { + "streaming" => { + // Try to deserialize as FlowResult::Streaming + tracing::debug!("StdioPlugin: Attempting to deserialize streaming result"); + match serde_json::from_value::(response.output.as_ref().clone()) { + Ok(flow_result) => { + tracing::info!("StdioPlugin: Successfully deserialized streaming result"); + return Ok(flow_result); + } + Err(e) => { + tracing::warn!("Failed to deserialize streaming result: {}, attempting flexible construction", e); + // Try to flexibly construct FlowResult::Streaming by adapting the structure + if let Some(obj) = response.output.as_ref().as_object() { + // Try to extract core streaming fields with flexible typing + let stream_id = obj.get("stream_id") + .and_then(|v| v.as_str()) + .unwrap_or("unknown"); + + let chunk = obj.get("chunk") + .and_then(|v| v.as_str()) + .unwrap_or(""); + + let chunk_index = obj.get("chunk_index") + .and_then(|v| v.as_u64().or_else(|| v.as_i64().map(|i| i as u64))) + .unwrap_or(0) as usize; + + let is_final = obj.get("is_final") + .and_then(|v| v.as_bool()) + .unwrap_or(false); + + // If we have a metadata field, use it; otherwise create one from remaining fields + let metadata = if let Some(existing_metadata) = obj.get("metadata") { + stepflow_core::workflow::ValueRef::new(existing_metadata.clone()) + } else { + // Create metadata from all fields except the core streaming ones + let mut metadata_obj = serde_json::Map::new(); + for (key, value) in obj.iter() { + if !matches!(key.as_str(), "outcome" | "stream_id" | "chunk" | "chunk_index" | "is_final") { + metadata_obj.insert(key.clone(), value.clone()); + } + } 
+ stepflow_core::workflow::ValueRef::new(serde_json::Value::Object(metadata_obj)) + }; + + let flow_result = stepflow_core::FlowResult::Streaming { + stream_id: stream_id.to_string(), + metadata, + chunk: chunk.to_string(), + chunk_index, + is_final, + }; + + tracing::info!("StdioPlugin: Successfully constructed streaming result flexibly"); + return Ok(flow_result); + } + tracing::warn!("Failed to flexibly construct streaming result, falling back to Success"); + } + } + } + "success" | "failed" | "skipped" => { + // Try to deserialize as any FlowResult variant + match serde_json::from_value::(response.output.as_ref().clone()) { + Ok(flow_result) => { + tracing::debug!("StdioPlugin: Successfully deserialized FlowResult: {:?}", flow_result); + return Ok(flow_result); + } + Err(e) => { + tracing::warn!("Failed to deserialize FlowResult: {}, falling back to Success", e); + } + } + } + _ => { + // Unknown outcome, treat as regular success + tracing::debug!("StdioPlugin: Unknown outcome '{}', treating as regular success", outcome_str); + } + } + } else { + tracing::debug!("StdioPlugin: outcome field is not a string"); + } + } else { + tracing::debug!("StdioPlugin: No outcome field found in response"); + } + } else { + tracing::debug!("StdioPlugin: Response output is not an object"); + } + + // Default behavior: wrap in Success Ok(FlowResult::Success { result: response.output, }) diff --git a/crates/stepflow-protocol/src/stdio/recv_message_loop.rs b/crates/stepflow-protocol/src/stdio/recv_message_loop.rs index ab4d2809..18314983 100644 --- a/crates/stepflow-protocol/src/stdio/recv_message_loop.rs +++ b/crates/stepflow-protocol/src/stdio/recv_message_loop.rs @@ -11,6 +11,7 @@ use tokio::{ }, }; use tokio_stream::{StreamExt as _, wrappers::LinesStream}; +use tracing::info; use uuid::Uuid; use crate::stdio::{Result, StdioError}; @@ -90,6 +91,7 @@ impl ReceiveMessageLoop { Some(stderr_line) = self.from_child_stderr.next() => { let stderr_line = stderr_line.change_context(StdioError::Recv)?; tracing::info!("Component stderr: {stderr_line}"); + eprintln!("[component stderr] {stderr_line}"); Ok(true) } Some(line) = self.from_child_stdout.next() => { @@ -100,7 +102,7 @@ impl ReceiveMessageLoop { tracing::warn!("Received very long message ({} chars), may be truncated", line.len()); } - tracing::info!("Received line from child: {line:?}"); + tracing::info!("Received line from child"); // Add better error handling for JSON parsing let msg = match OwnedIncoming::try_new(line.clone()) { @@ -128,6 +130,143 @@ impl ReceiveMessageLoop { tracing::error!("Full message: {}", line); } + // Try to handle concatenated JSON messages + if open_braces > 1 && close_braces > 1 { + tracing::info!("Attempting to split concatenated JSON messages"); + let mut current_pos = 0; + let mut brace_count = 0; + let mut start_pos = 0; + let mut messages_parsed = 0; + + for (i, ch) in line.chars().enumerate() { + if ch == '{' { + if brace_count == 0 { + start_pos = i; + } + brace_count += 1; + } else if ch == '}' { + brace_count -= 1; + if brace_count == 0 { + // We have a complete JSON object + let json_str = &line[start_pos..=i]; + match OwnedIncoming::try_new(json_str.to_string()) { + Ok(msg) => { + tracing::info!("Successfully parsed concatenated message #{}", messages_parsed + 1); + messages_parsed += 1; + + // Process this message + match (msg.method, msg.params, msg.id) { + (Some(method), Some(params), _) => { + let method_owned = method.to_string(); + let params_owned: Box = params.to_owned(); + + if let 
Ok(v)=serde_json::from_str::(params_owned.get()){info!(method=%method_owned,request_id=%v["request_id"].as_str().unwrap_or(""),stream_id=%v["stream_id"].as_str().unwrap_or(""),chunk_index=v["chunk_index"].as_u64().unwrap_or_default(),is_final=v["is_final"].as_bool().unwrap_or(false),output_file=%v["output_file"].as_str().unwrap_or(""),"Received incoming method call");} + IncomingHandlerRegistry::instance().spawn_handle_incoming(method_owned, params_owned, msg.id, self.outgoing_tx.clone(), context.clone()); + } + (None, None, Some(id)) => { + // Handle method response + if let Some(pending) = self.pending_requests.remove(&id) { + pending.send(msg).map_err(|_| StdioError::Send)?; + } + } + _ => { + tracing::warn!("Received invalid concatenated message: {:?}", msg); + } + } + } + Err(parse_err) => { + tracing::warn!("Failed to parse concatenated JSON message: {}", parse_err); + } + } + } + } + } + + if messages_parsed > 0 { + tracing::info!("Successfully parsed {} concatenated messages", messages_parsed); + return Ok(true); + } + } + + // Try more aggressive message recovery for edge cases + tracing::info!("Attempting aggressive message recovery"); + let mut messages_parsed = 0; + + // Try to find valid JSON objects by looking for complete message patterns + let mut pos = 0; + while pos < line.len() { + // Find the start of a potential JSON object + if let Some(start) = line[pos..].find("{\"jsonrpc\":\"2.0\"") { + let start_pos = pos + start; + + // Try to find the matching closing brace + let mut brace_count = 0; + let mut end_pos = start_pos; + let mut found_end = false; + + for (i, ch) in line[start_pos..].chars().enumerate() { + if ch == '{' { + brace_count += 1; + } else if ch == '}' { + brace_count -= 1; + if brace_count == 0 { + end_pos = start_pos + i; + found_end = true; + break; + } + } + } + + if found_end { + let json_str = &line[start_pos..=end_pos]; + match OwnedIncoming::try_new(json_str.to_string()) { + Ok(msg) => { + tracing::info!("Successfully recovered message #{}", messages_parsed + 1); + messages_parsed += 1; + + // Process this message + match (msg.method, msg.params, msg.id) { + (Some(method), Some(params), _) => { + let method_owned = method.to_string(); + let params_owned: Box = params.to_owned(); + + if let Ok(v)=serde_json::from_str::(params_owned.get()){info!(method=%method_owned,request_id=%v["request_id"].as_str().unwrap_or(""),stream_id=%v["stream_id"].as_str().unwrap_or(""),chunk_index=v["chunk_index"].as_u64().unwrap_or_default(),is_final=v["is_final"].as_bool().unwrap_or(false),output_file=%v["output_file"].as_str().unwrap_or(""),"Received incoming method call");} + IncomingHandlerRegistry::instance().spawn_handle_incoming(method_owned, params_owned, msg.id, self.outgoing_tx.clone(), context.clone()); + } + (None, None, Some(id)) => { + // Handle method response + if let Some(pending) = self.pending_requests.remove(&id) { + pending.send(msg).map_err(|_| StdioError::Send)?; + } + } + _ => { + tracing::warn!("Received invalid recovered message: {:?}", msg); + } + } + + // Move position to after this message + pos = end_pos + 1; + } + Err(parse_err) => { + tracing::warn!("Failed to parse recovered JSON message: {}", parse_err); + pos = start_pos + 1; + } + } + } else { + // No matching end found, move to next potential start + pos = start_pos + 1; + } + } else { + // No more JSON objects found + break; + } + } + + if messages_parsed > 0 { + tracing::info!("Successfully recovered {} messages", messages_parsed); + return Ok(true); + } + // Instead of returning an 
error and terminating the loop, // log the error and continue processing other messages tracing::warn!("Skipping malformed message and continuing..."); @@ -143,7 +282,7 @@ impl ReceiveMessageLoop { let params_owned: Box = params.to_owned(); // Handle the incoming method call - tracing::info!("Received incoming method call: {} with params: {:?}", method_owned, params_owned); + if let Ok(v)=serde_json::from_str::(params_owned.get()){info!(method=%method_owned,request_id=%v["request_id"].as_str().unwrap_or(""),stream_id=%v["stream_id"].as_str().unwrap_or(""),chunk_index=v["chunk_index"].as_u64().unwrap_or_default(),is_final=v["is_final"].as_bool().unwrap_or(false),output_file=%v["output_file"].as_str().unwrap_or(""),"Received incoming method call");} IncomingHandlerRegistry::instance().spawn_handle_incoming(method_owned, params_owned, msg.id, self.outgoing_tx.clone(), context.clone()); Ok(true) } diff --git a/examples/audio-streaming-pipeline.yaml b/examples/audio-streaming-pipeline.yaml index 1e333f69..becab47a 100644 --- a/examples/audio-streaming-pipeline.yaml +++ b/examples/audio-streaming-pipeline.yaml @@ -65,6 +65,7 @@ steps: sample_rate: { $from: { step: audio_source }, path: sample_rate } channels: { $from: { step: audio_source }, path: channels } operation: { $from: { workflow: input }, path: operation } + output_file: { $from: { workflow: input }, path: output_file } # Output the processed chunks - id: output_chunk @@ -77,6 +78,6 @@ steps: output_file: { $from: { workflow: input }, path: output_file } output: - processed_chunks: { $from: { step: output_chunk }, path: result } - source_metadata: { $from: { step: audio_source }, path: sample_rate } - processing_metadata: { $from: { step: process_chunk }, path: sample_rate } \ No newline at end of file + # Note: Streaming steps don't have final results in the state store + # The output file is written directly by the audio_sink component + message: "Audio streaming pipeline completed" \ No newline at end of file diff --git a/examples/audio_input.json b/examples/audio_input.json index 25a274dd..051ba0e5 100644 --- a/examples/audio_input.json +++ b/examples/audio_input.json @@ -6,6 +6,6 @@ "chunk_size": 1024, "frequency": 440.0, "duration": 3.0, - "output_file": "test_workflow_webcam.wav", + "output_file": "output.wav", "device_name": "C922 Pro Stream Webcam" } diff --git a/examples/test_audio_pipeline.sh b/examples/test_audio_pipeline.sh index 6a6d16df..3ede2265 100755 --- a/examples/test_audio_pipeline.sh +++ b/examples/test_audio_pipeline.sh @@ -6,6 +6,11 @@ set -e # Exit on any error +# Always reinstall the Python SDK in editable mode before running the test +cd "$(dirname "$0")/../sdks/python" +uv pip install -e . 
+cd - > /dev/null + # Get script directory and current working directory SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)" CURRENT_DIR="$(pwd)" @@ -50,6 +55,12 @@ DURATION=${3:-"3.0"} OUTPUT_FILE=${4:-"test_workflow_webcam.wav"} DEVICE_NAME=${5:-"C922 Pro Stream Webcam"} +# Set defaults for other parameters if not set +SAMPLE_RATE=${SAMPLE_RATE:-44100} +CHANNELS=${CHANNELS:-1} +CHUNK_SIZE=${CHUNK_SIZE:-1024} +FREQUENCY=${FREQUENCY:-440.0} + # Determine the absolute path for the output file # The Python SDK runs from the examples directory, so it will create the file there if [[ "$CURRENT_DIR" == "$SCRIPT_DIR" ]]; then @@ -68,24 +79,24 @@ echo "Output: $ABSOLUTE_OUTPUT_FILE" echo "Device: $DEVICE_NAME" echo "" -# Create a temporary input file with the provided parameters +# Create temporary input file TEMP_INPUT=$(mktemp --suffix=.json) cat > "$TEMP_INPUT" << EOF { "source": "$SOURCE", - "operation": "$OPERATION", - "sample_rate": 44100, - "channels": 1, - "chunk_size": 1024, - "frequency": 440.0, "duration": $DURATION, - "output_file": "$ABSOLUTE_OUTPUT_FILE", - "device_name": "$DEVICE_NAME" + "sample_rate": $SAMPLE_RATE, + "channels": $CHANNELS, + "chunk_size": $CHUNK_SIZE, + "frequency": $FREQUENCY, + "output_file": "$OUTPUT_FILE", + "device_name": "$DEVICE_NAME", + "operation": "$OPERATION" } EOF echo "📝 Using input configuration:" -cat "$TEMP_INPUT" +cat "$TEMP_INPUT" | jq '.' echo "" # Run the workflow diff --git a/sdks/python/src/stepflow_sdk/audio_components.py b/sdks/python/src/stepflow_sdk/audio_components.py index 0a921e9b..9b811fe8 100644 --- a/sdks/python/src/stepflow_sdk/audio_components.py +++ b/sdks/python/src/stepflow_sdk/audio_components.py @@ -16,6 +16,11 @@ import queue import sys import numpy as np +import datetime + +# GUARANTEED DEBUG OUTPUT - This should appear every time the module is loaded +sys.stderr.write("=== AUDIO_COMPONENTS.PY MODULE LOADED ===\n") +sys.stderr.flush() try: import sounddevice as sd @@ -32,16 +37,17 @@ class AudioChunk: channels: int chunk_index: int timestamp: float + stream_id: str class AudioStreamSource: """Individual audio source component for generating audio chunks.""" - def __init__(self, sample_rate: int = 16000, channels: int = 1, chunk_size: int = 1024): + def __init__(self, sample_rate: int = 16000, channels: int = 1, chunk_size: int = 1024, stream_id: str = None): self.sample_rate = sample_rate self.channels = channels self.chunk_size = chunk_size - self.stream_id = str(uuid.uuid4()) + self.stream_id = stream_id or str(uuid.uuid4()) def start_microphone_stream(self): """Initialize microphone stream.""" @@ -74,7 +80,8 @@ def get_microphone_chunk(self) -> AudioChunk: sample_rate=self.sample_rate, channels=self.channels, chunk_index=0, - timestamp=time.time() + timestamp=time.time(), + stream_id=self.stream_id ) def generate_sine_wave_chunk(self, frequency: float = 440.0, duration: float = 0.1) -> AudioChunk: @@ -94,7 +101,8 @@ def generate_sine_wave_chunk(self, frequency: float = 440.0, duration: float = 0 sample_rate=self.sample_rate, channels=self.channels, chunk_index=0, - timestamp=time.time() + timestamp=time.time(), + stream_id=self.stream_id ) def start_system_audio_stream(self): @@ -107,7 +115,7 @@ def start_system_audio_stream(self): if not self.device_info: raise RuntimeError("No suitable system audio device found") - print(f"Using system audio device: {self.device_info['name']}", file=sys.stderr) + log_debug(f"Using system audio device: {self.device_info['name']}", "audio_stream_source") def 
_find_system_audio_device(self): """Find a suitable system audio device.""" @@ -145,10 +153,18 @@ def get_system_audio_chunk(self): sample_rate=self.sample_rate, channels=self.channels, chunk_index=0, - timestamp=time.time() + timestamp=time.time(), + stream_id=self.stream_id ) +def log_debug(message, component="unknown"): + """Write debug message to stderr so it shows up in StepFlow logs.""" + timestamp = datetime.datetime.now().strftime("%Y-%m-%d %H:%M:%S") + sys.stderr.write(f"[{timestamp}] [{component}] {message}\n") + sys.stderr.flush() # Ensure it is written immediately + + def audio_stream_source(data: Dict[str, Any], context=None): """ Component that generates audio stream chunks. @@ -166,19 +182,31 @@ def audio_stream_source(data: Dict[str, Any], context=None): Output: Streaming audio chunks with metadata """ - import time - start_time = time.time() + # Test stderr output + log_debug("TEST: audio_stream_source function called", "audio_stream_source") + log_debug(f"audio_stream_source received input data: {data}", "audio_stream_source") + + # Extract parameters from input data source_type = data.get('source', 'sine_wave') - duration = data.get('duration', 5.0) requested_sample_rate = data.get('sample_rate', 44100) + device_name = data.get('device_name', None) + duration = data.get('duration', 5.0) channels = data.get('channels', 1) chunk_size = data.get('chunk_size', 1024) frequency = data.get('frequency', 440.0) output_file = data.get('output_file', 'output_audio.wav') - device_name = data.get('device_name', None) - print(f"TIMING: Starting audio_stream_source at {start_time}", file=sys.stderr) + log_debug(f"Extracted parameters - source_type: {source_type}, requested_sample_rate: {requested_sample_rate}, device_name: {device_name}", "audio_stream_source") + + start_time = time.time() + + # Debug: Print the actual input data + log_debug(f"DEBUG: audio_stream_source received input data: {data}", "audio_stream_source") + + stream_id = str(uuid.uuid4()) + + log_debug(f"TIMING: Starting audio_stream_source at {start_time}", "audio_stream_source") # Initialize PyAudio audio = pyaudio.PyAudio() @@ -190,34 +218,52 @@ def audio_stream_source(data: Dict[str, Any], context=None): info = audio.get_device_info_by_index(i) if device_name.lower() in info['name'].lower(): device_index = i - print(f"Found device: {info['name']} (index {i})", file=sys.stderr) + log_debug(f"Found device: {info['name']} (index {i})", "audio_stream_source") break - # Auto-detect sample rate if device is specified + # Auto-detect sample rate if device is specified and requested rate fails sample_rate = requested_sample_rate if device_index is not None: - sample_rates = [16000, 22050, 44100, 48000] - for rate in sample_rates: - try: - test_stream = audio.open(format=pyaudio.paInt16, - channels=channels, - rate=rate, - input=True, - input_device_index=device_index, - frames_per_buffer=chunk_size) - test_stream.close() - sample_rate = rate - print(f"Using sample rate: {sample_rate} Hz for device", file=sys.stderr) - break - except OSError: - continue + # First try the requested sample rate + try: + test_stream = audio.open(format=pyaudio.paInt16, + channels=channels, + rate=requested_sample_rate, + input=True, + input_device_index=device_index, + frames_per_buffer=chunk_size) + test_stream.close() + sample_rate = requested_sample_rate + log_debug(f"Using requested sample rate: {sample_rate} Hz for device", "audio_stream_source") + except OSError: + log_debug(f"Requested sample rate {requested_sample_rate} Hz not 
supported, trying alternatives...", "audio_stream_source") + # Try alternative sample rates if requested rate fails + sample_rates = [16000, 22050, 44100, 48000] + for rate in sample_rates: + if rate == requested_sample_rate: + continue # Skip the requested rate since it already failed + try: + test_stream = audio.open(format=pyaudio.paInt16, + channels=channels, + rate=rate, + input=True, + input_device_index=device_index, + frames_per_buffer=chunk_size) + test_stream.close() + sample_rate = rate + log_debug(f"Using alternative sample rate: {sample_rate} Hz for device", "audio_stream_source") + break + except OSError: + continue # Calculate how many chunks we need for the full duration chunk_duration = chunk_size / sample_rate # seconds per chunk total_chunks = int(duration / chunk_duration) - print(f"DEBUG: Generating {total_chunks} chunks for {duration}s audio at {sample_rate}Hz", file=sys.stderr) - print(f"DEBUG: chunk_duration={chunk_duration}s, chunk_size={chunk_size} samples", file=sys.stderr) + log_debug(f"DEBUG: Generating {total_chunks} chunks for {duration}s audio at {sample_rate}Hz", "audio_stream_source") + log_debug(f"DEBUG: chunk_duration={chunk_duration}s, chunk_size={chunk_size} samples", "audio_stream_source") + log_debug(f"DEBUG: duration={duration}s, sample_rate={sample_rate}Hz", "audio_stream_source") + log_debug(f"DEBUG: total_chunks calculation: {duration} / {chunk_duration} = {total_chunks}", "audio_stream_source") # Collect all chunks for direct WAV file writing all_chunks = [] @@ -226,9 +272,11 @@ def audio_stream_source(data: Dict[str, Any], context=None): # Set up continuous recording with queue audio_queue = queue.Queue() recording_stop = threading.Event() + recording_error = None def record_audio_continuously(): """Background thread that continuously records audio.""" + nonlocal recording_error try: if device_index is not None: stream = audio.open( @@ -248,7 +296,7 @@ def record_audio_continuously(): frames_per_buffer=chunk_size ) - print(f"Started continuous recording from device {device_index}", file=sys.stderr) + log_debug(f"Started continuous recording from device {device_index}", "audio_stream_source") chunk_index = 0 while not recording_stop.is_set() and chunk_index < total_chunks: @@ -256,77 +304,78 @@ def record_audio_continuously(): data = stream.read(chunk_size, exception_on_overflow=False) audio_queue.put((chunk_index, data)) chunk_index += 1 + log_debug(f"DEBUG: Recording thread put chunk {chunk_index}/{total_chunks} in queue", "audio_stream_source") + if chunk_index % 10 == 0: # Log every 10th chunk + log_debug(f"DEBUG: Recording thread recorded chunk {chunk_index}/{total_chunks}", "audio_stream_source") except Exception as e: - print(f"Recording error: {e}", file=sys.stderr) + log_debug(f"Recording error: {e}", "audio_stream_source") + recording_error = e break stream.stop_stream() stream.close() - print(f"Recording thread completed after {chunk_index} chunks", file=sys.stderr) + log_debug(f"Recording thread completed after {chunk_index} chunks", "audio_stream_source") except Exception as e: - print(f"Failed to start recording: {e}", file=sys.stderr) + log_debug(f"Failed to start recording: {e}", "audio_stream_source") + recording_error = e # Start recording thread recording_thread = threading.Thread(target=record_audio_continuously, daemon=True) recording_thread.start() - print(f"DEBUG: Started continuous recording thread", file=sys.stderr) + log_debug(f"DEBUG: Started continuous recording thread", "audio_stream_source") - # Stream chunks as 
they become available - for chunk_index in range(total_chunks): - chunk_start_time = time.time() - print(f"TIMING: Waiting for chunk {chunk_index}/{total_chunks-1} at {chunk_start_time}", file=sys.stderr) - + # Process chunks from the recording thread + processed_chunks = 0 + + while processed_chunks < total_chunks: try: - # Wait for chunk from recording thread (with timeout) - received_index, chunk_data = audio_queue.get(timeout=5.0) # 5 second timeout + # Wait indefinitely for chunks - no timeout + chunk_index, chunk_data = audio_queue.get() + all_chunks.append((chunk_index, chunk_data)) - if received_index != chunk_index: - print(f"WARNING: Expected chunk {chunk_index} but got {received_index}", file=sys.stderr) + # Determine if this is the final chunk + is_final = chunk_index >= total_chunks - 1 - audio_capture_time = time.time() - print(f"TIMING: Got chunk {chunk_index} from queue in {audio_capture_time - chunk_start_time:.4f}s", file=sys.stderr) + log_debug(f"DEBUG: Processing chunk {chunk_index}/{total_chunks}, processed={processed_chunks}, is_final={is_final}", "audio_stream_source") - except queue.Empty: - print(f"ERROR: Timeout waiting for chunk {chunk_index}", file=sys.stderr) - # Generate silence as fallback - chunk_data = b'\x00' * (chunk_size * 2) # 16-bit = 2 bytes per sample - - # Store chunk for WAV file writing - all_chunks.append(chunk_data) - - chunk_b64 = base64.b64encode(chunk_data).decode('utf-8') - is_final = chunk_index >= total_chunks - 1 - - encoding_time = time.time() - print(f"TIMING: Base64 encoding took {encoding_time - audio_capture_time:.4f}s", file=sys.stderr) - - print(f"DEBUG: Yielding chunk {chunk_index}/{total_chunks-1}, is_final={is_final}", file=sys.stderr) - - yield { - "outcome": "streaming", - "stream_id": str(uuid.uuid4()), - "sample_rate": sample_rate, - "channels": channels, - "chunk_size": len(chunk_data), - "format": "pcm_16bit", - "chunk": chunk_b64, - "chunk_index": chunk_index, - "is_final": is_final - } - - chunk_end_time = time.time() - print(f"TIMING: Total chunk {chunk_index} processing took {chunk_end_time - chunk_start_time:.4f}s", file=sys.stderr) - + # Yield the chunk + yield { + "outcome": "streaming", + "stream_id": stream_id, + "sample_rate": sample_rate, + "channels": channels, + "chunk_size": chunk_size, + "format": "pcm_16bit", + "chunk": base64.b64encode(chunk_data).decode('utf-8'), + "chunk_index": chunk_index, + "is_final": is_final, + "output_file": output_file + } + + processed_chunks += 1 + + except Exception as e: + log_debug(f"DEBUG: Error processing chunk {processed_chunks}: {e}", "audio_stream_source") + break + + log_debug(f"DEBUG: Main loop completed after processing {processed_chunks} chunks", "audio_stream_source") + # Stop recording recording_stop.set() recording_thread.join(timeout=2.0) + log_debug(f"DEBUG: Microphone recording loop completed. 
Processed {len(all_chunks)} chunks out of {total_chunks} expected.", "audio_stream_source") + + # Check for any recording errors after completion + if recording_error: + raise RuntimeError(f"Microphone recording failed: {recording_error}") + elif source_type == 'system_audio': # Similar implementation for system audio try: - source = AudioStreamSource(sample_rate, channels, chunk_size) + source = AudioStreamSource(sample_rate, channels, chunk_size, stream_id=stream_id) source.start_system_audio_stream() for chunk_index in range(total_chunks): @@ -334,7 +383,7 @@ def record_audio_continuously(): chunk = source.get_system_audio_chunk() audio_capture_time = time.time() - print(f"TIMING: System audio capture took {audio_capture_time - chunk_start_time:.4f}s", file=sys.stderr) + log_debug(f"TIMING: System audio capture took {audio_capture_time - chunk_start_time:.4f}s", "audio_stream_source") all_chunks.append(chunk.data) chunk_b64 = base64.b64encode(chunk.data).decode('utf-8') @@ -342,20 +391,21 @@ def record_audio_continuously(): yield { "outcome": "streaming", - "stream_id": chunk.stream_id, + "stream_id": stream_id, "sample_rate": chunk.sample_rate, "channels": chunk.channels, "chunk_size": len(chunk.data), "format": "pcm_16bit", "chunk": chunk_b64, "chunk_index": chunk_index, - "is_final": is_final + "is_final": is_final, + "output_file": output_file } except Exception as e: - print(f"System audio capture failed: {e}. Falling back to sine wave.", file=sys.stderr) - source_type = 'sine_wave' + log_debug(f"System audio capture failed: {e}. Raising error instead of falling back.", "audio_stream_source") + raise RuntimeError(f"System audio capture failed: {e}") - if source_type == 'sine_wave': + elif source_type == 'sine_wave': # Generate sine wave chunks (no queue needed) source = AudioStreamSource(sample_rate, channels, chunk_size) @@ -364,7 +414,7 @@ def record_audio_continuously(): chunk = source.generate_sine_wave_chunk(frequency, chunk_duration) audio_capture_time = time.time() - print(f"TIMING: Sine wave generation took {audio_capture_time - chunk_start_time:.4f}s", file=sys.stderr) + log_debug(f"TIMING: Sine wave generation took {audio_capture_time - chunk_start_time:.4f}s", "audio_stream_source") all_chunks.append(chunk.data) chunk_b64 = base64.b64encode(chunk.data).decode('utf-8') @@ -372,38 +422,26 @@ def record_audio_continuously(): yield { "outcome": "streaming", - "stream_id": chunk.stream_id, + "stream_id": stream_id, "sample_rate": chunk.sample_rate, "channels": chunk.channels, "chunk_size": len(chunk.data), "format": "pcm_16bit", "chunk": chunk_b64, "chunk_index": chunk_index, - "is_final": is_final + "is_final": is_final, + "output_file": output_file } + else: + raise ValueError(f"Unsupported audio source type: {source_type}. Supported types: microphone, system_audio, sine_wave") - print(f"DEBUG: Generator loop completed. Processed {len(all_chunks)} chunks.", file=sys.stderr) + log_debug(f"DEBUG: Generator loop completed. 
Processed {len(all_chunks)} chunks.", "audio_stream_source") - # Write WAV file directly when streaming completes - if all_chunks: - try: - print(f"DEBUG: Writing WAV file directly: {output_file}", file=sys.stderr) - all_audio_data = b''.join(all_chunks) - - with wave.open(output_file, 'wb') as wav_file: - wav_file.setnchannels(channels) - wav_file.setsampwidth(2) # 16-bit - wav_file.setframerate(sample_rate) - wav_file.writeframes(all_audio_data) - - print(f"DEBUG: WAV file written successfully: {output_file} ({len(all_audio_data)} bytes)", file=sys.stderr) - except Exception as e: - print(f"ERROR: Failed to write WAV file {output_file}: {e}", file=sys.stderr) - else: - print(f"DEBUG: No chunks collected, skipping WAV file write", file=sys.stderr) + # Note: WAV file writing is now handled by the audio_sink component + # to ensure we write the processed audio, not just the source audio total_time = time.time() - start_time - print(f"TIMING: Total audio_stream_source execution took {total_time:.4f}s", file=sys.stderr) + log_debug(f"TIMING: Total audio_stream_source execution took {total_time:.4f}s", "audio_stream_source") def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: @@ -423,18 +461,35 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: import time start_time = time.time() - chunk_b64 = data['chunk'] - chunk_index = data.get('chunk_index', 0) - sample_rate = data.get('sample_rate', 16000) - channels = data.get('channels', 1) - operation = data.get('operation', 'analyze') - - print(f"TIMING: audio_chunk_processor starting chunk {chunk_index} at {start_time}", file=sys.stderr) + # Handle streaming chunk format - extract the actual chunk data + if 'outcome' in data and data['outcome'] == 'streaming': + # This is a streaming chunk, extract the chunk data + chunk_b64 = data.get('chunk', '') + chunk_index = data.get('chunk_index', 0) + sample_rate = data.get('sample_rate', 16000) + channels = data.get('channels', 1) + stream_id = data.get('stream_id', f'processed_{chunk_index}') + is_final = data.get('is_final', False) + operation = data.get('operation', 'passthrough') # Default operation + # Pass through output_file from workflow input + output_file = data.get('output_file', 'output_audio.wav') + else: + # Direct input format + chunk_b64 = data.get('chunk', '') + chunk_index = data.get('chunk_index', 0) + sample_rate = data.get('sample_rate', 16000) + channels = data.get('channels', 1) + stream_id = data.get('stream_id', f'processed_{chunk_index}') + is_final = data.get('is_final', False) + operation = data.get('operation', 'passthrough') + output_file = data.get('output_file', 'output_audio.wav') + + log_debug(f"TIMING: audio_chunk_processor starting chunk {chunk_index} at {start_time}", "audio_chunk_processor") # Decode base64 chunk chunk_data = base64.b64decode(chunk_b64) decode_time = time.time() - print(f"TIMING: Base64 decode took {decode_time - start_time:.4f}s", file=sys.stderr) + log_debug(f"TIMING: Base64 decode took {decode_time - start_time:.4f}s", "audio_chunk_processor") # Convert bytes to samples samples = [] @@ -443,7 +498,7 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: samples.append(sample) convert_time = time.time() - print(f"TIMING: Sample conversion took {convert_time - decode_time:.4f}s", file=sys.stderr) + log_debug(f"TIMING: Sample conversion took {convert_time - decode_time:.4f}s", "audio_chunk_processor") if operation == "amplify": # Amplify the audio (multiply by 
gain factor) @@ -455,18 +510,19 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: amplified_b64 = base64.b64encode(amplified_data).decode('utf-8') process_time = time.time() - print(f"TIMING: Amplification processing took {process_time - convert_time:.4f}s", file=sys.stderr) + log_debug(f"TIMING: Amplification processing took {process_time - convert_time:.4f}s", "audio_chunk_processor") result = { "outcome": "streaming", - "stream_id": data.get('stream_id', f"processed_{chunk_index}"), + "stream_id": stream_id, "sample_rate": sample_rate, "channels": channels, "operation": "amplify", "gain": gain, "chunk": amplified_b64, "chunk_index": chunk_index, - "is_final": data.get('is_final', False) + "is_final": is_final, + "output_file": output_file } elif operation == "analyze": @@ -479,7 +535,7 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: max_amplitude = avg_amplitude = rms = 0 process_time = time.time() - print(f"TIMING: Analysis processing took {process_time - convert_time:.4f}s", file=sys.stderr) + log_debug(f"TIMING: Analysis processing took {process_time - convert_time:.4f}s", "audio_chunk_processor") result = { "outcome": "success", @@ -491,24 +547,26 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: "rms": rms, "sample_rate": sample_rate, "channels": channels - } + }, + "output_file": output_file } else: # Pass through unchanged result = { "outcome": "streaming", - "stream_id": data.get('stream_id', f"passthrough_{chunk_index}"), + "stream_id": stream_id, "sample_rate": sample_rate, "channels": channels, "operation": "passthrough", "chunk": chunk_b64, "chunk_index": chunk_index, - "is_final": data.get('is_final', False) + "is_final": is_final, + "output_file": output_file } total_time = time.time() - start_time - print(f"TIMING: audio_chunk_processor total time for chunk {chunk_index}: {total_time:.4f}s", file=sys.stderr) + log_debug(f"TIMING: audio_chunk_processor total time for chunk {chunk_index}: {total_time:.4f}s", "audio_chunk_processor") return result @@ -530,19 +588,56 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: import time start_time = time.time() - chunk_b64 = data.get('chunk', '') - chunk_index = data.get('chunk_index', 0) - stream_id = data.get('stream_id', 'unknown') - output_file = data.get('output_file', 'output_audio.wav') - play_audio = data.get('play_audio', False) - - print(f"TIMING: audio_sink starting chunk {chunk_index} at {start_time}", file=sys.stderr) + # Global storage for accumulating chunks across function calls + if not hasattr(audio_sink, '_chunk_storage'): + audio_sink._chunk_storage = {} + + # Handle streaming chunk format - extract the actual chunk data + if 'outcome' in data and data['outcome'] == 'streaming': + # This is a streaming chunk, extract the chunk data + chunk_b64 = data.get('chunk', '') + chunk_index = data.get('chunk_index', 0) + stream_id = data.get('stream_id', 'unknown') + sample_rate = data.get('sample_rate', 16000) + channels = data.get('channels', 1) + is_final = data.get('is_final', False) + # For streaming chunks, get output_file from the data (passed from workflow) + output_file = data.get('output_file', 'output_audio.wav') + play_audio = data.get('play_audio', False) + else: + # Direct input format + chunk_b64 = data.get('chunk', '') + chunk_index = data.get('chunk_index', 0) + stream_id = data.get('stream_id', 'unknown') + sample_rate = data.get('sample_rate', 16000) + channels = 
data.get('channels', 1) + is_final = data.get('is_final', False) + output_file = data.get('output_file', 'output_audio.wav') + play_audio = data.get('play_audio', False) + + log_debug(f"TIMING: audio_sink starting chunk {chunk_index} at {start_time}", "audio_sink") + log_debug(f"DEBUG: audio_sink output_file: {output_file}", "audio_sink") + log_debug(f"DEBUG: audio_sink is_final: {is_final}", "audio_sink") + log_debug(f"DEBUG: audio_sink stream_id: {stream_id}", "audio_sink") # Decode the chunk if chunk_b64: chunk_data = base64.b64decode(chunk_b64) decode_time = time.time() - print(f"TIMING: Base64 decode took {decode_time - start_time:.4f}s", file=sys.stderr) + log_debug(f"TIMING: Base64 decode took {decode_time - start_time:.4f}s", "audio_sink") + + # Store the chunk for later writing + if stream_id not in audio_sink._chunk_storage: + audio_sink._chunk_storage[stream_id] = { + 'chunks': [], + 'sample_rate': sample_rate, + 'channels': channels, + 'output_file': output_file + } + + audio_sink._chunk_storage[stream_id]['chunks'].append(chunk_data) + + log_debug(f"DEBUG: Stored chunk {chunk_index} for stream {stream_id}, total chunks: {len(audio_sink._chunk_storage[stream_id]['chunks'])}", "audio_sink") # Convert to samples for analysis samples = [] @@ -559,7 +654,7 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: max_amplitude = avg_amplitude = rms = 0 analysis_time = time.time() - print(f"TIMING: Audio analysis took {analysis_time - decode_time:.4f}s", file=sys.stderr) + log_debug(f"TIMING: Audio analysis took {analysis_time - decode_time:.4f}s", "audio_sink") # Play audio if requested if play_audio: @@ -571,16 +666,46 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: audio_array = np.array(samples, dtype=np.int16) # Play the audio - sd.play(audio_array, samplerate=data.get('sample_rate', 16000)) + sd.play(audio_array, samplerate=sample_rate) sd.wait() play_time = time.time() - print(f"TIMING: Audio playback took {play_time - analysis_time:.4f}s", file=sys.stderr) + log_debug(f"TIMING: Audio playback took {play_time - analysis_time:.4f}s", "audio_sink") except ImportError: - print("WARNING: sounddevice not available, skipping audio playback", file=sys.stderr) + log_debug("WARNING: sounddevice not available, skipping audio playback", "audio_sink") + except Exception as e: + log_debug(f"ERROR: Audio playback failed: {e}", "audio_sink") + + # Write WAV file if this is the final chunk + if is_final and stream_id in audio_sink._chunk_storage: + try: + log_debug(f"DEBUG: Writing final WAV file: {output_file}", "audio_sink") + storage = audio_sink._chunk_storage[stream_id] + all_audio_data = b''.join(storage['chunks']) + + # Ensure the output directory exists + output_dir = os.path.dirname(output_file) + if output_dir and not os.path.exists(output_dir): + log_debug(f"DEBUG: Creating output directory: {output_dir}", "audio_sink") + os.makedirs(output_dir, exist_ok=True) + + log_debug(f"DEBUG: Writing {len(all_audio_data)} bytes to {output_file}", "audio_sink") + with wave.open(output_file, 'wb') as wav_file: + wav_file.setnchannels(storage['channels']) + wav_file.setsampwidth(2) # 16-bit + wav_file.setframerate(storage['sample_rate']) + wav_file.writeframes(all_audio_data) + + log_debug(f"DEBUG: WAV file written successfully: {output_file} ({len(all_audio_data)} bytes)", "audio_sink") + + # Clean up storage for this stream + del audio_sink._chunk_storage[stream_id] + except Exception as e: - print(f"ERROR: Audio playback failed: {e}", file=sys.stderr) 
+ log_debug(f"ERROR: Failed to write WAV file {output_file}: {e}", "audio_sink") + import traceback + traceback.print_exc(file=sys.stderr) result = { "outcome": "success", @@ -592,7 +717,9 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: "rms": rms, "sample_count": len(samples), "chunk_size_bytes": len(chunk_data), - "output_file": output_file + "output_file": output_file, + "is_final": is_final, + "total_chunks_stored": len(audio_sink._chunk_storage.get(stream_id, {}).get('chunks', [])) } } else: @@ -606,6 +733,6 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: } total_time = time.time() - start_time - print(f"TIMING: audio_sink total time for chunk {chunk_index}: {total_time:.4f}s", file=sys.stderr) + log_debug(f"TIMING: audio_sink total time for chunk {chunk_index}: {total_time:.4f}s", "audio_sink") return result \ No newline at end of file diff --git a/sdks/python/src/stepflow_sdk/protocol.py b/sdks/python/src/stepflow_sdk/protocol.py index 043d6ed7..af2b87b6 100644 --- a/sdks/python/src/stepflow_sdk/protocol.py +++ b/sdks/python/src/stepflow_sdk/protocol.py @@ -30,6 +30,8 @@ class ComponentInfoResponse(Struct, kw_only=True): class ComponentExecuteRequest(Struct, kw_only=True): component: str input: msgspec.Raw + execution_id: str + step_id: str class ComponentExecuteResponse(Struct, kw_only=True): output: Any \ No newline at end of file diff --git a/sdks/python/src/stepflow_sdk/server.py b/sdks/python/src/stepflow_sdk/server.py index b49b7d59..dbfb2cc4 100644 --- a/sdks/python/src/stepflow_sdk/server.py +++ b/sdks/python/src/stepflow_sdk/server.py @@ -161,17 +161,31 @@ async def _handle_method_request(self, request: Message) -> Message | None: # For generators, we need to yield each result as streaming if inspect.isgenerator(output): results = [] + chunk_index = 0 for result in output: results.append(result) - # Send streaming notification - await self._outgoing_queue.put({ + is_final = False # We'll mark the last chunk as final later if needed + + # Send streaming notification immediately via stdout instead of queuing + streaming_notification = { "jsonrpc": "2.0", "method": "streaming_chunk", "params": { - "request_id": str(id), + "request_id": str(execute_request.execution_id), + "stream_id": str(execute_request.execution_id), + "chunk_index": chunk_index, + "is_final": is_final, + "step_id": execute_request.step_id, "chunk": result } - }) + } + # Send immediately via stdout + notification_bytes = msgspec.json.encode(streaming_notification) + b"\n" + sys.stdout.buffer.write(notification_bytes) + sys.stdout.buffer.flush() + print(f"Sent outgoing message", file=sys.stderr) + + chunk_index += 1 # Return the final result (last chunk) if results: @@ -179,12 +193,6 @@ async def _handle_method_request(self, request: Message) -> Message | None: id=id, result=ComponentExecuteResponse(output=results[-1]), ) - else: - # Empty generator - return Message( - id=id, - result=ComponentExecuteResponse(output={"outcome": "success", "result": None}), - ) else: # Not actually a generator, treat as normal return Message( @@ -366,7 +374,10 @@ async def _send_outgoing_message(self, message_data, writer: asyncio.StreamWrite message_bytes = msgspec.json.encode(message_data) + b"\n" writer.write(message_bytes) await writer.drain() - print(f"Sent outgoing message: {message_data}", file=sys.stderr) + # Ensure the message is fully written and flushed + if hasattr(writer, '_transport') and hasattr(writer._transport, 'flush'): + writer._transport.flush() + 
print(f"Sent outgoing message", file=sys.stderr) except Exception as e: print(f"Error sending outgoing message: {e}", file=sys.stderr) From 42f6eac6277fadb6b2e558257d56f574d4374d18 Mon Sep 17 00:00:00 2001 From: phact Date: Thu, 26 Jun 2025 00:23:08 -0400 Subject: [PATCH 09/14] loggin --- crates/stepflow-execution/src/workflow_executor.rs | 11 ++++++++++- 1 file changed, 10 insertions(+), 1 deletion(-) diff --git a/crates/stepflow-execution/src/workflow_executor.rs b/crates/stepflow-execution/src/workflow_executor.rs index e487cec0..1c9e700e 100644 --- a/crates/stepflow-execution/src/workflow_executor.rs +++ b/crates/stepflow-execution/src/workflow_executor.rs @@ -114,6 +114,7 @@ impl WorkflowExecutor { pipeline_steps.iter().map(|i| (*i, &flow.steps[*i].id, &flow.steps[*i].component)).collect::>() ); + tracing::info!("[DEBUG-INIT] Creating streaming coordinator in WorkflowExecutor::new"); let coordinator = StreamingPipelineCoordinator::new( executor.clone(), flow.clone(), @@ -1477,13 +1478,18 @@ impl StreamingPipelineCoordinator { for &step_idx in &pipeline_steps { let step_id = flow.steps[step_idx].id.clone(); - // Take sender & receiver out now, before spawning + // Take the receiver for this step - this is the correct approach + // The sender stays in the coordinator so route_chunk_to_running_pipeline can send to it let rx = guard.step_receivers.remove(&step_id).ok_or_else(|| { + tracing::error!("[DEBUG-CHANNEL] No receiver found for step {}", step_id); ExecutionError::Internal })?; + tracing::info!("[DEBUG-CHANNEL] Moved receiver for step {} to task", step_id); let _sender = guard.step_senders.get(&step_id).unwrap().clone(); // Keep sender in map for handle_chunk let downstream = guard.step_downstream_senders .get(&step_id).cloned().unwrap_or_default(); + + tracing::info!("[DEBUG-CHANNEL] Step {} spawning with {} downstream channels", step_id, downstream.len()); let input = step_inputs.remove(&step_idx).ok_or_else(|| { ExecutionError::Internal })?; @@ -1708,6 +1714,9 @@ async fn run_streaming_step_simple( // Forward to downstream steps stream_log!(info, &step_id, "forwarding chunk #{} to {} downstream", final_chunk_index, downstream.len()); + if downstream.is_empty() { + stream_log!(warn, &step_id, "no downstream channels to forward to!"); + } for (i, tx) in downstream.iter().enumerate() { match tx.send(FlowResult::Streaming { stream_id: final_stream_id.clone(), From 4380087a189d43a6648f5dd5af29634ccd60e87d Mon Sep 17 00:00:00 2001 From: phact Date: Thu, 26 Jun 2025 09:41:38 -0400 Subject: [PATCH 10/14] WIP --- crates/stepflow-execution/src/executor.rs | 23 +- .../src/workflow_executor.rs | 200 +++++++++++++----- crates/stepflow-main/src/error.rs | 2 + crates/stepflow-main/src/repl.rs | 101 ++++++--- crates/stepflow-server/src/api/debug.rs | 19 +- 5 files changed, 251 insertions(+), 94 deletions(-) diff --git a/crates/stepflow-execution/src/executor.rs b/crates/stepflow-execution/src/executor.rs index 463e7cb2..a4becd33 100644 --- a/crates/stepflow-execution/src/executor.rs +++ b/crates/stepflow-execution/src/executor.rs @@ -108,13 +108,13 @@ impl StepFlowExecutor { } /// Get or create a debug session for step-by-step execution control - pub async fn debug_session(&self, execution_id: Uuid) -> Result { + pub async fn debug_session(&self, execution_id: Uuid) -> Result>> { // Check if session already exists { let sessions = self.debug_sessions.read().await; - if let Some(_session) = sessions.get(&execution_id) { - // Return a clone of the session (WorkflowExecutor should implement Clone 
if needed) - // For now, we'll create a new session each time since WorkflowExecutor is not Clone + if let Some(session) = sessions.get(&execution_id) { + tracing::info!("Reusing existing WorkflowExecutor for debug session: {}", execution_id); + return Ok(session.clone()); } } @@ -148,7 +148,14 @@ impl StepFlowExecutor { self.state_store.clone(), )?; - Ok(workflow_executor) + // Store the executor for future reuse + let executor_arc = Arc::new(tokio::sync::Mutex::new(workflow_executor)); + { + let mut sessions = self.debug_sessions.write().await; + sessions.insert(execution_id, executor_arc.clone()); + } + + Ok(executor_arc) } /// Get a workflow executor for debug sessions @@ -166,6 +173,12 @@ impl StepFlowExecutor { // For now, return None since we don't have access to the flow None } + + /// Get an existing debug session without creating a new one + pub async fn get_debug_session(&self, execution_id: Uuid) -> Option>> { + let sessions = self.debug_sessions.read().await; + sessions.get(&execution_id).cloned() + } } impl Context for StepFlowExecutor { diff --git a/crates/stepflow-execution/src/workflow_executor.rs b/crates/stepflow-execution/src/workflow_executor.rs index 1c9e700e..0032f275 100644 --- a/crates/stepflow-execution/src/workflow_executor.rs +++ b/crates/stepflow-execution/src/workflow_executor.rs @@ -32,16 +32,28 @@ pub(crate) async fn execute_workflow( input: ValueRef, state_store: Arc, ) -> Result { - let mut workflow_executor = WorkflowExecutor::new( - executor, - flow, - workflow_hash, - execution_id, - input, - state_store, - )?; - - workflow_executor.execute_to_completion().await + // Check if there's already a debug session for this execution ID + let existing_debug_session = executor.get_debug_session(execution_id).await; + + if let Some(debug_session) = existing_debug_session { + // Use the existing debug session + tracing::info!("Using existing debug session for execution ID: {}", execution_id); + let mut workflow_executor = debug_session.lock().await; + workflow_executor.execute_to_completion().await + } else { + // Create a new workflow executor + tracing::info!("Executing workflow using tracker-based execution"); + let mut workflow_executor = WorkflowExecutor::new( + executor, + flow, + workflow_hash, + execution_id, + input, + state_store, + )?; + + workflow_executor.execute_to_completion().await + } } /// Workflow executor that manages the execution of a single workflow. 
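// --- Illustrative sketch (annotation, not part of the patch): the intended usage pattern for
// --- the shared debug session now that `debug_session` returns Arc<tokio::sync::Mutex<WorkflowExecutor>>.
// --- Assumes an `executor: Arc<StepFlowExecutor>` and a known `execution_id`; error handling is
// --- collapsed to `expect` for brevity, and the helper name is hypothetical.
async fn drive_debug_session(executor: std::sync::Arc<StepFlowExecutor>, execution_id: uuid::Uuid) {
    // The first call creates and stores the WorkflowExecutor; later calls return the same Arc,
    // so the REPL and the HTTP debug API operate on one shared execution.
    let session = executor
        .debug_session(execution_id)
        .await
        .expect("debug session should be created");

    // Callers lock the mutex before driving the executor, mirroring the repl.rs and debug.rs
    // changes later in this patch.
    let mut workflow_executor = session.lock().await;
    let runnable = workflow_executor.get_runnable_steps().await;
    tracing::info!("has runnable steps: {}", !runnable.is_empty());
    let _final_result = workflow_executor
        .execute_to_completion()
        .await
        .expect("execution should complete");
}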
@@ -1288,55 +1300,100 @@ impl StreamingPipelineCoordinator { /// Route chunks to the running pipeline without requiring mutable access to the coordinator /// This allows chunks to be routed while the receivers are moved out for step tasks pub async fn route_chunk_to_running_pipeline( - coord_arc: Arc>, + coord_arc: Arc>, chunk_json: serde_json::Value, ) -> Result<()> { let map = serde_json::from_value::>(chunk_json) .map_err(|e| ExecutionError::MalformedReference { message: e.to_string() })?; + // Extract chunk metadata + let chunk_index = map.get("chunk_index") + .and_then(|v| v.as_u64()) + .unwrap_or(0) as usize; + + let is_final = map.get("is_final") + .and_then(|v| v.as_bool()) + .unwrap_or(false); + + // Extract the step ID this chunk came FROM + let source_step_id = if let Some(step_id) = map.get("step_id").and_then(|v| v.as_str()) { + step_id.to_string() + } else { + // Default to first step if no step_id provided + let coord = coord_arc.lock().await; + let first_step_idx = coord.pipeline_steps[0]; + let first_step_id = coord.flow.steps[first_step_idx].id.clone(); + tracing::info!("No step_id in chunk, defaulting to first pipeline step: {}", first_step_id); + drop(coord); // Release the lock early + first_step_id + }; + let coord = coord_arc.lock().await; - // Extract the step ID this chunk belongs to (default to first pipeline step) - let step_id = map.get("step_id") - .and_then(|v| v.as_str()) - .map(|s| s.to_string()) - .unwrap_or_else(|| { - // Default to first step (source step) if no step_id provided - let first_step_idx = coord.pipeline_steps[0]; - let first_step_id = coord.flow.steps[first_step_idx].id.clone(); - tracing::info!("No step_id in chunk, defaulting to first pipeline step: {}", first_step_id); - first_step_id - }); - - let stream_id = map.get("stream_id") .and_then(|v| v.as_str()).unwrap_or_default().to_string(); - let chunk_index = map.get("chunk_index").and_then(|v| v.as_u64()).unwrap_or(0) as usize; - let is_final = map.get("is_final") .and_then(|v| v.as_bool()).unwrap_or(false); - - // Build the FlowResult - let fr = FlowResult::Streaming { - stream_id: stream_id.clone(), - metadata: stepflow_core::workflow::ValueRef::new(serde_json::Value::Object(map.clone())), - chunk: map.get("chunk").and_then(|v|v.as_str()).unwrap_or("").to_string(), - chunk_index, - is_final, + // Find the index of the source step in the pipeline + let source_step_pipeline_index = coord.pipeline_steps.iter() + .enumerate() + .find_map(|(i, &step_idx)| { + if coord.flow.steps[step_idx].id == source_step_id { + Some(i) + } else { + None + } + }); + + // Find the next step in the pipeline (if any) + let target_step_id = if let Some(source_idx) = source_step_pipeline_index { + if source_idx + 1 < coord.pipeline_steps.len() { + // Get the next step in the pipeline + let next_step_idx = coord.pipeline_steps[source_idx + 1]; + let next_step_id = coord.flow.steps[next_step_idx].id.clone(); + tracing::info!("Routing chunk from step {} to next step {}", source_step_id, next_step_id); + next_step_id + } else { + // This is the last step in the pipeline, no forwarding needed + tracing::info!("Step {} is the last in pipeline, no forwarding needed", source_step_id); + return Ok(()); + } + } else { + // Couldn't find the source step in the pipeline, use the source step ID as fallback + tracing::warn!("Could not find step {} in pipeline, using as target", source_step_id); + source_step_id.clone() }; - - // Send to the step's channel (only if the sender still exists) - if let Some(tx) = 
coord.step_senders.get(&step_id) { - tracing::info!("Found sender for step {}, attempting to send chunk {}", step_id, chunk_index); - tracing::info!("HANDLE_CHUNK step={} idx={} final={}", step_id, chunk_index, is_final); - tracing::debug!("send -> {} (buffer={})", step_id, tx.capacity()); + + // Send to the target step's channel + if let Some(tx) = coord.step_senders.get(&target_step_id) { + tracing::info!("[SEND-DEBUG] Found sender for target step {}, attempting to send chunk {} (tx addr: {:p})", + target_step_id, chunk_index, tx); + + // Create a FlowResult from the chunk data + let fr = FlowResult::Streaming { + stream_id: map.get("stream_id") + .and_then(|v| v.as_str()) + .unwrap_or("unknown") + .to_string(), + metadata: stepflow_core::workflow::ValueRef::new(serde_json::json!(map)), + chunk: map.get("chunk") + .and_then(|v| v.as_str()) + .unwrap_or("") + .to_string(), + chunk_index, + is_final, + }; + match tx.send(fr.clone()).await { Ok(_) => { - tracing::info!("Successfully routed chunk {} to step {} (pipeline steps: {:?})", chunk_index, step_id, coord.pipeline_steps); + tracing::info!("[SEND-DEBUG] Successfully routed chunk {} from step {} to step {}", + chunk_index, source_step_id, target_step_id); } Err(e) => { - tracing::error!("Failed to route chunk {} to step {}: {:?}", chunk_index, step_id, e); - return Err(ExecutionError::StepFailed { step: step_id.clone() }.into()); + tracing::error!("[SEND-DEBUG] Failed to send chunk {} to step {}: {:?}", + chunk_index, target_step_id, e); + return Err(ExecutionError::StepFailed { step: target_step_id.clone() }.into()); } } } else { - tracing::warn!("No channel for step {} (available steps: {:?})", step_id, coord.step_senders.keys().collect::>()); + tracing::warn!("[SEND-DEBUG] No channel for target step {} (available steps: {:?})", + target_step_id, coord.step_senders.keys().collect::>()); } Ok(()) @@ -1411,10 +1468,18 @@ impl StreamingPipelineCoordinator { let step_id = flow.steps[step_index].id.clone(); let (input_tx, input_rx) = tokio::sync::mpsc::channel(100); let sender_clone = input_tx.clone(); + + // Log channel creation with memory addresses + tracing::info!( + "[CHANNEL-DEBUG] Created channel for step {} (index {}): tx={:p}, rx={:p}", + step_id, + step_index, + &sender_clone as *const _, + &input_rx as *const _ + ); + step_senders.insert(step_id.clone(), sender_clone); step_receivers.insert(step_id.clone(), input_rx); - tracing::info!("[DEBUG-CHANNEL] Created channel for step {} (index {}) - receiver capacity: {}", - step_id, step_index, 100); } // Set up the pipeline connections @@ -1657,8 +1722,38 @@ async fn run_streaming_step_simple( loop { tracing::info!("[STREAM] Step {} waiting for chunk via receiver", step_id); - let recv_result = rx.recv().await; - tracing::info!("[STREAM] Step {} received result from rx.recv(): {:?}", step_id, recv_result.is_some()); + // Before waiting for data, log channel details + tracing::info!( + "[STREAM-DEBUG] Step {} waiting for chunk via receiver (rx addr: {:p})", + step_id, + &rx as *const _ + ); + + // Check if the channel has been closed already + if rx.is_closed() { + stream_log!(warn, &step_id, "channel is already closed before receiving any data"); + } + + // Add timeout to prevent indefinite blocking + let recv_result = match tokio::time::timeout( + std::time::Duration::from_secs(10), // 10 second timeout + rx.recv() + ).await { + Ok(result) => { + tracing::info!( + "[STREAM-DEBUG] Step {} received data from channel: is_some={}", + step_id, + result.is_some() + ); + result + }, + 
Err(_) => { + stream_log!(warn, &step_id, "TIMEOUT waiting for chunk after 10 seconds"); + // Continue with loop to try again or return None to exit + None + } + }; + match recv_result { Some(FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final }) => { stream_log!(info, &step_id, "RECEIVED chunk #{} from receiver", chunk_index); @@ -1895,7 +1990,7 @@ mod tests { pub async fn create_workflow_from_yaml_simple( yaml_str: &str, mock_behaviors: Vec<(&str, FlowResult)>, - ) -> (Arc, Arc, FlowHash) { + ) { // Parse the YAML workflow let flow: Flow = serde_yaml_ng::from_str(yaml_str).expect("Failed to parse YAML workflow"); let flow = Arc::new(flow); @@ -2112,6 +2207,7 @@ output: .await .unwrap(); + // Check the final result match result { FlowResult::Success { result } => { assert_eq!(result.as_ref(), &json!({"final": 30})); @@ -2232,7 +2328,6 @@ output: "#; let workflow_input = json!({"value": 42}); - let step1_output = json!({"step1": "done"}); let step2_output = json!({"step2": "done"}); let final_output = json!({"both": "completed"}); @@ -2542,8 +2637,3 @@ output: } } - - - - - diff --git a/crates/stepflow-main/src/error.rs b/crates/stepflow-main/src/error.rs index a0f3f38b..c98ed978 100644 --- a/crates/stepflow-main/src/error.rs +++ b/crates/stepflow-main/src/error.rs @@ -36,6 +36,8 @@ pub enum MainError { ReplCommand(String), #[error("Configuration error")] Configuration, + #[error("No active debug session")] + NoDebugSession, } pub type Result> = std::result::Result; diff --git a/crates/stepflow-main/src/repl.rs b/crates/stepflow-main/src/repl.rs index e1485f0b..421ede39 100644 --- a/crates/stepflow-main/src/repl.rs +++ b/crates/stepflow-main/src/repl.rs @@ -4,7 +4,7 @@ use error_stack::ResultExt as _; use rustyline::{DefaultEditor, error::ReadlineError}; use std::{path::PathBuf, sync::Arc}; use stepflow_core::workflow::{Flow, FlowHash, ValueRef}; -use stepflow_execution::{StepFlowExecutor, WorkflowExecutor}; +use stepflow_execution::{StepExecutionResult, StepFlowExecutor, WorkflowExecutor}; use stepflow_plugin::Context as _; use crate::{ @@ -19,7 +19,8 @@ pub struct LastRun { pub workflow_hash: FlowHash, pub workflow_path: PathBuf, pub input: ValueRef, - pub last_execution: Option, + pub last_execution: Option>>, + pub execution_id: Option, } impl LastRun { @@ -35,6 +36,7 @@ impl LastRun { workflow_path, input, last_execution: None, + execution_id: None, } } @@ -66,32 +68,46 @@ impl LastRun { pub async fn create_debug_execution( &mut self, executor: &Arc, - ) -> Result<&mut WorkflowExecutor> { - let state_store = executor.state_store(); + ) -> Result<()> { let execution_id = uuid::Uuid::new_v4(); - let workflow_executor = WorkflowExecutor::new( - executor.clone(), + + // Submit the workflow to get it registered + executor.submit_flow( self.workflow.clone(), self.workflow_hash.clone(), - execution_id, self.input.clone(), - state_store.clone(), - ) - .change_context(MainError::FlowExecution)?; - - self.last_execution = Some(workflow_executor); - Ok(self.last_execution.as_mut().unwrap()) + ).await.change_context(MainError::FlowExecution)?; + + // Get the debug session executor + let debug_executor = executor.debug_session(execution_id) + .await + .change_context(MainError::FlowExecution)?; + + // Store the execution ID for later reference + self.execution_id = Some(execution_id); + + // Store the executor + self.last_execution = Some(debug_executor); + + Ok(()) } /// Get the current debug execution, if any - pub fn debug_execution(&mut self) -> Option<&mut 
WorkflowExecutor> { - self.last_execution.as_mut() + pub async fn execute_step(&mut self, step_id: &str) -> Result { + if let Some(executor) = &self.last_execution { + let mut workflow_executor = executor.lock().await; + workflow_executor.execute_step_by_id(step_id).await + .change_context(MainError::FlowExecution) + } else { + Err(error_stack::report!(MainError::NoDebugSession)) + } } /// Update input and clear any existing execution pub fn update_input(&mut self, input: ValueRef) { self.input = input; - self.last_execution = None; // Clear execution since input changed + self.last_execution = None; + self.execution_id = None; } } @@ -386,7 +402,10 @@ async fn handle_steps_command(state: &ReplState) -> Result<()> { if let Some(last_run) = &state.last_run { if let Some(debug_session) = &last_run.last_execution { - let all_steps = debug_session.list_all_steps().await; + // Lock the mutex to access the WorkflowExecutor + let workflow_executor = debug_session.lock().await; + + let all_steps = workflow_executor.list_all_steps().await; println!("Workflow steps ({} total):", all_steps.len()); for step_status in &all_steps { println!( @@ -421,7 +440,10 @@ async fn handle_runnable_command(state: &ReplState) -> Result<()> { if let Some(last_run) = &state.last_run { if let Some(debug_session) = &last_run.last_execution { - let runnable_steps = debug_session.get_runnable_steps().await; + // Lock the mutex to access the WorkflowExecutor + let workflow_executor = debug_session.lock().await; + + let runnable_steps = workflow_executor.get_runnable_steps().await; if runnable_steps.is_empty() { println!( "No steps are currently runnable. All dependencies may be satisfied or workflow is complete." @@ -458,8 +480,11 @@ async fn handle_run_step_command(step_id: String, state: &mut ReplState) -> Resu } if let Some(last_run) = &mut state.last_run { - if let Some(debug_session) = last_run.debug_execution() { - match debug_session.execute_step_by_id(&step_id).await { + if let Some(debug_session) = &last_run.last_execution { + // Lock the mutex to access the WorkflowExecutor + let mut workflow_executor = debug_session.lock().await; + + match workflow_executor.execute_step_by_id(&step_id).await { Ok(result) => { print_step_result(&step_id, &result.result)?; } @@ -490,8 +515,11 @@ async fn handle_run_steps_command(step_ids: Vec, state: &mut ReplState) } if let Some(last_run) = &mut state.last_run { - if let Some(debug_session) = last_run.debug_execution() { - match debug_session.execute_steps(&step_ids).await { + if let Some(debug_session) = &last_run.last_execution { + // Lock the mutex to access the WorkflowExecutor + let mut workflow_executor = debug_session.lock().await; + + match workflow_executor.execute_steps(&step_ids).await { Ok(results) => { println!("Executed {} steps:", results.len()); for result in results { @@ -525,8 +553,11 @@ async fn handle_run_all_command(state: &mut ReplState) -> Result<()> { } if let Some(last_run) = &mut state.last_run { - if let Some(debug_session) = last_run.debug_execution() { - match debug_session.execute_all_runnable().await { + if let Some(debug_session) = &last_run.last_execution { + // Lock the mutex to access the WorkflowExecutor + let mut workflow_executor = debug_session.lock().await; + + match workflow_executor.execute_all_runnable().await { Ok(results) => { if results.is_empty() { println!("No runnable steps to execute."); @@ -564,9 +595,12 @@ async fn handle_continue_command(state: &mut ReplState) -> Result<()> { } if let Some(last_run) = &mut state.last_run { - if 
let Some(debug_session) = last_run.debug_execution() { + if let Some(debug_session) = &last_run.last_execution { + // Lock the mutex to access the WorkflowExecutor + let mut workflow_executor = debug_session.lock().await; + println!("Continuing workflow execution to completion..."); - match debug_session.execute_to_completion().await { + match workflow_executor.execute_to_completion().await { Ok(final_result) => { // Print final result let result_json = serde_json::to_string_pretty(&final_result) @@ -616,7 +650,10 @@ async fn handle_inspect_command(step_id: String, state: &ReplState) -> Result<() if let Some(last_run) = &state.last_run { if let Some(debug_session) = &last_run.last_execution { - match debug_session.inspect_step(&step_id).await { + // Lock the mutex to access the WorkflowExecutor + let workflow_executor = debug_session.lock().await; + + match workflow_executor.inspect_step(&step_id).await { Ok(inspection) => { println!("Step '{}' inspection:", step_id); println!(" Index: {}", inspection.metadata.step_index); @@ -663,7 +700,10 @@ async fn handle_completed_command(state: &ReplState) -> Result<()> { if let Some(last_run) = &state.last_run { if let Some(debug_session) = &last_run.last_execution { - match debug_session.get_completed_steps().await { + // Lock the mutex to access the WorkflowExecutor + let workflow_executor = debug_session.lock().await; + + match workflow_executor.get_completed_steps().await { Ok(completed_steps) => { if completed_steps.is_empty() { println!("No steps have been completed yet."); @@ -714,7 +754,10 @@ async fn handle_output_command(step_id: String, state: &ReplState) -> Result<()> if let Some(last_run) = &state.last_run { if let Some(debug_session) = &last_run.last_execution { - match debug_session.get_step_output(&step_id).await { + // Lock the mutex to access the WorkflowExecutor + let workflow_executor = debug_session.lock().await; + + match workflow_executor.get_step_output(&step_id).await { Ok(result) => { println!("Output of step '{}':", step_id); print_flow_result(&result)?; diff --git a/crates/stepflow-server/src/api/debug.rs b/crates/stepflow-server/src/api/debug.rs index 915ab5ed..0972929a 100644 --- a/crates/stepflow-server/src/api/debug.rs +++ b/crates/stepflow-server/src/api/debug.rs @@ -59,13 +59,16 @@ pub async fn debug_execute_step( Json(req): Json, ) -> Result, ErrorResponse> { // Get the debug session for this run - let mut debug_session = executor + let debug_session = executor .debug_session(run_id) .await .change_context(ServerError::ExecutionNotFound(run_id))?; + // Lock the mutex to access the WorkflowExecutor + let mut workflow_executor = debug_session.lock().await; + // Execute the requested steps - let step_results = debug_session.execute_steps(&req.step_ids).await?; + let step_results = workflow_executor.execute_steps(&req.step_ids).await?; // Convert results to the expected format let mut results = std::collections::HashMap::new(); @@ -96,13 +99,16 @@ pub async fn debug_continue( Path(run_id): Path, ) -> Result, ErrorResponse> { // Get the debug session for this run - let mut debug_session = executor + let debug_session = executor .debug_session(run_id) .await .change_context(ServerError::ExecutionNotFound(run_id))?; + // Lock the mutex to access the WorkflowExecutor + let mut workflow_executor = debug_session.lock().await; + // Continue run to completion - let final_result = debug_session.execute_to_completion().await?; + let final_result = workflow_executor.execute_to_completion().await?; // Update run status based on 
the result let state_store = executor.state_store(); @@ -149,8 +155,11 @@ pub async fn debug_get_runnable( .await .change_context(ServerError::ExecutionNotFound(run_id))?; + // Lock the mutex to access the WorkflowExecutor + let workflow_executor = debug_session.lock().await; + // Get runnable steps - let runnable_steps = debug_session + let runnable_steps = workflow_executor .get_runnable_steps() .await .into_iter() From 09214b714839c6ccb7b9a4dc8ac213490b5dca08 Mon Sep 17 00:00:00 2001 From: phact Date: Thu, 26 Jun 2025 16:01:00 -0400 Subject: [PATCH 11/14] streams to wav, proc still hangs --- Cargo.lock | 25 + crates/stepflow-execution/src/error.rs | 2 + .../src/workflow_executor.rs | 852 ++++++++---------- crates/stepflow-plugin/Cargo.toml | 5 + crates/stepflow-plugin/src/lib.rs | 1 + crates/stepflow-plugin/src/streaming.rs | 32 + crates/stepflow-protocol/src/blob_handlers.rs | 76 +- examples/audio_input.json | 2 +- .../src/stepflow_sdk/audio_components.py | 79 +- 9 files changed, 513 insertions(+), 561 deletions(-) create mode 100644 crates/stepflow-plugin/src/streaming.rs diff --git a/Cargo.lock b/Cargo.lock index 720ea251..54f7e7dc 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -559,6 +559,20 @@ dependencies = [ "typenum", ] +[[package]] +name = "dashmap" +version = "6.1.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "5041cc499144891f3790297212f32a74fb938e5136a14943f338ef9e0ae276cf" +dependencies = [ + "cfg-if", + "crossbeam-utils", + "hashbrown 0.14.5", + "lock_api", + "once_cell", + "parking_lot_core", +] + [[package]] name = "data-encoding" version = "2.9.0" @@ -1014,6 +1028,12 @@ dependencies = [ "ahash", ] +[[package]] +name = "hashbrown" +version = "0.14.5" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "e5274423e17b7c9fc20b6e7e208532f9b19825d82dfd615708b70edd83df41f1" + [[package]] name = "hashbrown" version = "0.15.4" @@ -2998,13 +3018,18 @@ dependencies = [ name = "stepflow-plugin" version = "0.1.0" dependencies = [ + "dashmap", "dynosaur", "error-stack", "futures", + "once_cell", "serde", + "serde_json", "stepflow-core", "stepflow-state", "thiserror 2.0.12", + "tokio", + "tracing", "trait-variant", "uuid", ] diff --git a/crates/stepflow-execution/src/error.rs b/crates/stepflow-execution/src/error.rs index be169897..7cf7c294 100644 --- a/crates/stepflow-execution/src/error.rs +++ b/crates/stepflow-execution/src/error.rs @@ -42,6 +42,8 @@ pub enum ExecutionError { ExecutionNotFound(Uuid), #[error("workflow '{0}' not found")] WorkflowNotFound(FlowHash), + #[error("streaming operation failed")] + StreamingError, } pub type Result> = std::result::Result; diff --git a/crates/stepflow-execution/src/workflow_executor.rs b/crates/stepflow-execution/src/workflow_executor.rs index 0032f275..64911ee0 100644 --- a/crates/stepflow-execution/src/workflow_executor.rs +++ b/crates/stepflow-execution/src/workflow_executor.rs @@ -1,3 +1,4 @@ +use std::collections::HashMap; use std::sync::Arc; use bit_set::BitSet; @@ -127,12 +128,20 @@ impl WorkflowExecutor { ); tracing::info!("[DEBUG-INIT] Creating streaming coordinator in WorkflowExecutor::new"); + + // Create chunk channel for this execution + let (chunk_tx, chunk_rx) = mpsc::channel::(100); + + // Register the chunk sender in the global registry + stepflow_plugin::streaming::register_chunk_sender(execution_id, chunk_tx); + let coordinator = StreamingPipelineCoordinator::new( executor.clone(), flow.clone(), pipeline_steps, context.clone(), resolver.clone(), + chunk_rx, ); 
Some(Arc::new(tokio::sync::Mutex::new(coordinator))) } else { @@ -877,8 +886,14 @@ impl WorkflowExecutor { return self.execute_streaming_pipeline_step(step_index).await; } - // Fallback to individual streaming step execution - self.execute_individual_streaming_step(step_index).await + // Log error: Individual streaming step execution (not part of a pipeline) + tracing::error!("Streaming step {} is not part of a streaming pipeline, cannot execute individually", step_id); + Err(ExecutionError::StepNotRunnable { + step: step.id.clone(), + } + .into()) + + } /// Check if a step is part of a streaming pipeline (has streaming inputs/outputs) @@ -1000,174 +1015,7 @@ impl WorkflowExecutor { pipeline_steps } - /// Execute an individual streaming step (fallback) - async fn execute_individual_streaming_step(&mut self, step_index: usize) -> Result<()> { - let step = &self.flow.steps[step_index]; - let step_id = step.id.clone(); - - // Update step status to Running - self.state_store - .update_step_status( - self.context.execution_id(), - step_index, - stepflow_core::status::StepStatus::Running, - ) - .await - .change_context_lazy(|| ExecutionError::StateError)?; - - // Resolve step inputs - let step_input = match self.resolver.resolve(&step.input).await? { - FlowResult::Success { result } => result, - FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { - // For streaming steps, we can handle streaming inputs - // For now, just return the metadata as the input - metadata - } - FlowResult::Skipped => { - return Err(ExecutionError::StepNotRunnable { - step: step_id.clone(), - } - .into()); - } - FlowResult::Failed { error } => { - return Err(ExecutionError::StepFailed { step: step_id }.into()); - } - }; - - // Get plugin - let plugin = self.executor.get_plugin(&step.component).await?; - - // For streaming steps, we need to: - // 1. Call the step once to start the generator - // 2. Wait for streaming chunks to come through the notification system - // 3. Process each chunk as it arrives - // 4. 
Stop when the final chunk arrives - - tracing::info!("[streaming] Starting streaming step {} with initial call", step_id); - - // Initial call to start the generator - let initial_result = execute_step_async(plugin.clone(), step, step_input.clone(), self.context.clone().with_step(step.id.clone())).await?; - - match initial_result { - FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { - tracing::info!("[streaming] Step {} started generator, received initial chunk (index={}, is_final={})", step_id, chunk_index, is_final); - - - // Process the initial chunk - let mut chunk_input_data = step_input.as_ref().clone(); - if let serde_json::Value::Object(ref mut map) = chunk_input_data { - map.insert("chunk".to_string(), serde_json::Value::String(chunk.clone())); - map.insert("stream_id".to_string(), serde_json::Value::String(stream_id.clone())); - map.insert("chunk_index".to_string(), serde_json::Value::Number(chunk_index.into())); - map.insert("is_final".to_string(), serde_json::Value::Bool(is_final)); - if let Some(metadata_obj) = metadata.as_ref().as_object() { - for (key, value) in metadata_obj { - map.insert(key.clone(), value.clone()); - } - } - } - let chunk_input = stepflow_core::workflow::ValueRef::new(chunk_input_data); - - let chunk_result = match tokio::time::timeout( - std::time::Duration::from_secs(5), - execute_step_async(plugin.clone(), step, chunk_input, self.context.clone().with_step(step.id.clone())) - ).await { - Ok(result) => result?, - Err(_) => { - tracing::warn!("[streaming] Step {} initial chunk processing timed out", step_id); - // Return a default result for timeout case - FlowResult::Success { - result: stepflow_core::workflow::ValueRef::new(serde_json::json!({ - "error": "timeout", - "message": "Initial chunk processing timed out" - })) - } - } - }; - - // If this is the final chunk, we're done - if is_final { - tracing::info!("[streaming] Step {} completed with final chunk from initial call", step_id); - } else { - // Wait for additional chunks to come through the streaming notification system - // The chunks will be routed via route_streaming_chunk method - tracing::info!("[streaming] Step {} waiting for additional chunks via streaming notifications", step_id); - - // For now, we'll wait a reasonable amount of time for chunks to arrive - // In a more sophisticated implementation, we'd have a proper notification system - let mut chunk_count = 1; - let max_wait_time = std::time::Duration::from_secs(30); // Wait up to 30 seconds - let start_time = std::time::Instant::now(); - - while start_time.elapsed() < max_wait_time { - // Sleep briefly to allow chunks to be processed - tokio::time::sleep(std::time::Duration::from_millis(100)).await; - - // Check if we should continue waiting - // This is a simplified approach - in practice, we'd have proper notification handling - chunk_count += 1; - if chunk_count % 100 == 0 { - tracing::debug!("[streaming] Step {} still waiting for chunks, elapsed: {:?}", step_id, start_time.elapsed()); - } - } - - tracing::info!("[streaming] Step {} finished waiting for chunks, elapsed: {:?}", step_id, start_time.elapsed()); - } - } - FlowResult::Success { result } => { - // Non-streaming result, treat as final - tracing::debug!("Streaming step {} completed with success", step_id); - } - FlowResult::Failed { error } => { - tracing::error!("Streaming step {} failed: {:?}", step_id, error); - - // Update step status to Failed - self.state_store - .update_step_status( - self.context.execution_id(), - step_index, - 
stepflow_core::status::StepStatus::Failed, - ) - .await - .change_context_lazy(|| ExecutionError::StateError)?; - - return Err(ExecutionError::StepFailed { step: step_id }.into()); - } - FlowResult::Skipped => { - tracing::debug!("Streaming step {} skipped", step_id); - } - } - - // Update step status to Completed - self.state_store - .update_step_status( - self.context.execution_id(), - step_index, - stepflow_core::status::StepStatus::Completed, - ) - .await - .change_context_lazy(|| ExecutionError::StateError)?; - - // Update dependency tracker for streaming step - self.tracker.complete_step(step_index); - - Ok(()) - } - /// Route a streaming chunk to the appropriate streaming pipeline - pub async fn route_streaming_chunk(&mut self, chunk: serde_json::Value) -> Result<()> { - tracing::info!("ROUTE_CHUNK[exec={} addr={:p}] called", self.execution_id(), self as *const _); - - if let Some(coord_arc) = &self.streaming_coordinator { - // Route chunks directly to the coordinator used by run_pipeline_without_lock - // This ensures chunks are sent to the same channels that the step tasks are listening on - StreamingPipelineCoordinator::route_chunk_to_running_pipeline(coord_arc.clone(), chunk).await?; - } else { - tracing::warn!("No streaming pipeline active for exec {}", self.execution_id()); - } - Ok(()) - } - /// Find currently active streaming steps using in-memory workflow information /// This avoids depending on state store data that might be cleaned up fn find_active_streaming_steps_in_memory(&self) -> Vec { @@ -1191,6 +1039,15 @@ impl WorkflowExecutor { } +impl Drop for WorkflowExecutor { + fn drop(&mut self) { + // Clean up the global chunk sender registry when the executor is dropped + let execution_id = self.execution_id(); + stepflow_plugin::streaming::unregister_chunk_sender(execution_id); + tracing::debug!("Cleaned up chunk sender for execution {}", execution_id); + } +} + /// Execute a single step asynchronously. 
pub(crate) async fn execute_step_async( plugin: Arc>, @@ -1291,164 +1148,14 @@ struct StreamingPipelineCoordinator { pipeline_steps: Vec, context: ExecutionContext, resolver: ValueResolver, - step_receivers: std::collections::HashMap>, - step_downstream_senders: std::collections::HashMap>>, - step_senders: std::collections::HashMap>, + step_downstream_senders: HashMap)>>, + step_receivers: HashMap>, + step_senders: HashMap>, + incoming_chunks: mpsc::Receiver, } impl StreamingPipelineCoordinator { - /// Route chunks to the running pipeline without requiring mutable access to the coordinator - /// This allows chunks to be routed while the receivers are moved out for step tasks - pub async fn route_chunk_to_running_pipeline( - coord_arc: Arc>, - chunk_json: serde_json::Value, - ) -> Result<()> { - let map = serde_json::from_value::>(chunk_json) - .map_err(|e| ExecutionError::MalformedReference { message: e.to_string() })?; - - // Extract chunk metadata - let chunk_index = map.get("chunk_index") - .and_then(|v| v.as_u64()) - .unwrap_or(0) as usize; - - let is_final = map.get("is_final") - .and_then(|v| v.as_bool()) - .unwrap_or(false); - - // Extract the step ID this chunk came FROM - let source_step_id = if let Some(step_id) = map.get("step_id").and_then(|v| v.as_str()) { - step_id.to_string() - } else { - // Default to first step if no step_id provided - let coord = coord_arc.lock().await; - let first_step_idx = coord.pipeline_steps[0]; - let first_step_id = coord.flow.steps[first_step_idx].id.clone(); - tracing::info!("No step_id in chunk, defaulting to first pipeline step: {}", first_step_id); - drop(coord); // Release the lock early - first_step_id - }; - - let coord = coord_arc.lock().await; - - // Find the index of the source step in the pipeline - let source_step_pipeline_index = coord.pipeline_steps.iter() - .enumerate() - .find_map(|(i, &step_idx)| { - if coord.flow.steps[step_idx].id == source_step_id { - Some(i) - } else { - None - } - }); - - // Find the next step in the pipeline (if any) - let target_step_id = if let Some(source_idx) = source_step_pipeline_index { - if source_idx + 1 < coord.pipeline_steps.len() { - // Get the next step in the pipeline - let next_step_idx = coord.pipeline_steps[source_idx + 1]; - let next_step_id = coord.flow.steps[next_step_idx].id.clone(); - tracing::info!("Routing chunk from step {} to next step {}", source_step_id, next_step_id); - next_step_id - } else { - // This is the last step in the pipeline, no forwarding needed - tracing::info!("Step {} is the last in pipeline, no forwarding needed", source_step_id); - return Ok(()); - } - } else { - // Couldn't find the source step in the pipeline, use the source step ID as fallback - tracing::warn!("Could not find step {} in pipeline, using as target", source_step_id); - source_step_id.clone() - }; - - // Send to the target step's channel - if let Some(tx) = coord.step_senders.get(&target_step_id) { - tracing::info!("[SEND-DEBUG] Found sender for target step {}, attempting to send chunk {} (tx addr: {:p})", - target_step_id, chunk_index, tx); - - // Create a FlowResult from the chunk data - let fr = FlowResult::Streaming { - stream_id: map.get("stream_id") - .and_then(|v| v.as_str()) - .unwrap_or("unknown") - .to_string(), - metadata: stepflow_core::workflow::ValueRef::new(serde_json::json!(map)), - chunk: map.get("chunk") - .and_then(|v| v.as_str()) - .unwrap_or("") - .to_string(), - chunk_index, - is_final, - }; - - match tx.send(fr.clone()).await { - Ok(_) => { - tracing::info!("[SEND-DEBUG] 
Successfully routed chunk {} from step {} to step {}", - chunk_index, source_step_id, target_step_id); - } - Err(e) => { - tracing::error!("[SEND-DEBUG] Failed to send chunk {} to step {}: {:?}", - chunk_index, target_step_id, e); - return Err(ExecutionError::StepFailed { step: target_step_id.clone() }.into()); - } - } - } else { - tracing::warn!("[SEND-DEBUG] No channel for target step {} (available steps: {:?})", - target_step_id, coord.step_senders.keys().collect::>()); - } - - Ok(()) - } - - /// Called by `WorkflowExecutor::route_streaming_chunk` to inject - /// *all* the chunks, not just the first. - pub async fn handle_chunk(&mut self, chunk_json: serde_json::Value) -> Result<()> { - let map = serde_json::from_value::>(chunk_json) - .map_err(|e| ExecutionError::MalformedReference { message: e.to_string() })?; - - // Extract the step ID this chunk belongs to (default to first pipeline step) - let step_id = map.get("step_id") - .and_then(|v| v.as_str()) - .map(|s| s.to_string()) - .unwrap_or_else(|| { - // Default to first step (source step) if no step_id provided - // This handles chunks coming from Python components that don't include step_id - let first_step_idx = self.pipeline_steps[0]; - let first_step_id = self.flow.steps[first_step_idx].id.clone(); - tracing::info!("No step_id in chunk, defaulting to first pipeline step: {}", first_step_id); - first_step_id - }); - - let stream_id = map.get("stream_id") .and_then(|v| v.as_str()).unwrap_or_default().to_string(); - let chunk_index = map.get("chunk_index").and_then(|v| v.as_u64()).unwrap_or(0) as usize; - let is_final = map.get("is_final") .and_then(|v| v.as_bool()).unwrap_or(false); - - // Build the FlowResult - let fr = FlowResult::Streaming { - stream_id: stream_id.clone(), - metadata: stepflow_core::workflow::ValueRef::new(serde_json::Value::Object(map.clone())), - chunk: map.get("chunk").and_then(|v|v.as_str()).unwrap_or("").to_string(), - chunk_index, - is_final, - }; - // Only deliver to the step itself - let the step handle forwarding downstream - if let Some(tx) = self.step_senders.get(&step_id) { - tracing::info!("Found sender for step {}, attempting to send chunk {}", step_id, chunk_index); - match tx.send(fr.clone()).await { - Ok(_) => { - tracing::info!("Successfully routed chunk {} to step {} (pipeline steps: {:?})", chunk_index, step_id, self.pipeline_steps); - } - Err(e) => { - tracing::error!("Failed to route chunk {} to step {}: {:?}", chunk_index, step_id, e); - return Err(ExecutionError::StepFailed { step: step_id.clone() }.into()); - } - } - } else { - tracing::warn!("No channel for step {} (available steps: {:?})", step_id, self.step_senders.keys().collect::>()); - } - - Ok(()) - } fn new( executor: Arc, @@ -1456,6 +1163,7 @@ impl StreamingPipelineCoordinator { pipeline_steps: Vec, context: ExecutionContext, resolver: ValueResolver, + incoming_chunks: mpsc::Receiver, ) -> Self { let mut step_receivers = std::collections::HashMap::new(); let mut step_downstream_senders = std::collections::HashMap::new(); @@ -1469,13 +1177,11 @@ impl StreamingPipelineCoordinator { let (input_tx, input_rx) = tokio::sync::mpsc::channel(100); let sender_clone = input_tx.clone(); - // Log channel creation with memory addresses + // Log channel creation tracing::info!( - "[CHANNEL-DEBUG] Created channel for step {} (index {}): tx={:p}, rx={:p}", + "[CHANNEL-DEBUG] Created channel for step {} (index {})", step_id, - step_index, - &sender_clone as *const _, - &input_rx as *const _ + step_index ); step_senders.insert(step_id.clone(), 
sender_clone); @@ -1490,16 +1196,16 @@ impl StreamingPipelineCoordinator { tracing::info!("[DEBUG-CHANNEL-SETUP] Processing step {} ({}) at position {}", step_id, step_index, i); // Set up downstream senders for this step - let mut downstream_senders = Vec::new(); + let mut downstream_connections = Vec::new(); if i < pipeline_steps.len() - 1 { // This step sends to the next step's input let next_step_index = pipeline_steps[i + 1]; let next_step_id = flow.steps[next_step_index].id.clone(); if let Some(next_step_sender) = step_senders.get(&next_step_id).cloned() { - downstream_senders.push(next_step_sender); + downstream_connections.push((next_step_id.clone(), next_step_sender)); } } - step_downstream_senders.insert(step_id, downstream_senders); + step_downstream_senders.insert(step_id, downstream_connections); } Self { @@ -1511,6 +1217,7 @@ impl StreamingPipelineCoordinator { step_receivers, step_downstream_senders, step_senders, + incoming_chunks, } } @@ -1582,34 +1289,34 @@ impl StreamingPipelineCoordinator { let guard = coord_arc.lock().await; (guard.flow.clone(), guard.pipeline_steps.clone()) }; - + // Give all tasks a moment to start tracing::info!("[DEBUG-PIPELINE] Giving tasks 500ms to start up"); tokio::time::sleep(std::time::Duration::from_millis(500)).await; - + // Now trigger the source component to start generating chunks if let Some(source_step_idx) = pipeline_steps.first() { let source_step_id = flow.steps[*source_step_idx].id.clone(); tracing::info!("[DEBUG-PIPELINE] Triggering source component {} to start generating", source_step_id); - + // Get the step input for the source step let source_input = { let guard = coord_arc.lock().await; guard.resolve_step_input(*source_step_idx).await? }; - + // Get the plugin for the source step let source_plugin = { let guard = coord_arc.lock().await; guard.executor.get_plugin(&flow.steps[*source_step_idx].component).await? }; - + // Create execution context for the source step let source_context = { let guard = coord_arc.lock().await; guard.context.clone().with_step(source_step_id.clone()) }; - + // Trigger the source component in a separate task (fire and forget) let source_step = flow.steps[*source_step_idx].clone(); tokio::spawn(async move { @@ -1624,29 +1331,210 @@ impl StreamingPipelineCoordinator { } }); } + + // Main loop: handle both incoming chunks and step completion using tokio::select + tracing::info!("[DEBUG-PIPELINE] Starting main loop to handle chunks and step completion"); + let mut remaining_handles = handles; + + // Extract incoming chunks receiver from coordinator + let mut incoming_chunks_rx = { + let mut guard = coord_arc.lock().await; + // Move the receiver out of the coordinator for the main loop + let (dummy_tx, dummy_rx) = mpsc::channel::(1); + std::mem::replace(&mut guard.incoming_chunks, dummy_rx) + }; + + loop { + tokio::select! 
{ + // Handle incoming chunks from the global registry + Some(chunk_json) = incoming_chunks_rx.recv() => { + tracing::info!("Main loop received chunk from global registry"); + + // Route the chunk to the appropriate step without locking the coordinator + match Self::route_chunk_to_steps(&coord_arc, chunk_json).await { + Ok(_) => { + tracing::info!("Successfully routed chunk to step"); + } + Err(e) => { + tracing::error!("Failed to route chunk to step: {:?}", e); + } + } + } + + // Handle step completions + _ = async { + // Check if any handles are ready + let mut i = 0; + while i < remaining_handles.len() { + let (step_idx, handle) = &mut remaining_handles[i]; + if handle.is_finished() { + let (step_idx, handle) = remaining_handles.remove(i); + let step_id = &flow.steps[step_idx].id; + + match handle.await { + Ok(result) => { + if let Err(e) = result { + tracing::warn!("Step {} completed with error: {:?}", step_id, e); + return Err(e); + } else { + tracing::info!("Step {} completed successfully", step_id); + } + } + Err(e) => { + tracing::warn!("Step {} task panicked: {:?}", step_id, e); + return Err(ExecutionError::Internal.into()); + } + } + } else { + i += 1; + } + } + + // If no handles completed, sleep briefly to avoid busy loop + if !remaining_handles.is_empty() { + tokio::time::sleep(std::time::Duration::from_millis(10)).await; + } + + Ok::<(), error_stack::Report>(()) + } => { + // Handle step completion result + } + } + + // Exit when all handles are done + if remaining_handles.is_empty() { + tracing::info!("[DEBUG-PIPELINE] All step handles completed"); + break; + } + } + + tracing::info!("[DEBUG-PIPELINE] run_pipeline_without_lock completed successfully"); + Ok(()) + } + + /// Route a chunk to the appropriate step without requiring a full coordinator lock + async fn route_chunk_to_steps( + coord_arc: &Arc>, + chunk_json: serde_json::Value, + ) -> Result<()> { + let map = serde_json::from_value::>(chunk_json) + .map_err(|e| ExecutionError::MalformedReference { message: e.to_string() })?; + + // Extract chunk metadata from top-level map first + let chunk_index = map.get("chunk_index").and_then(|v| v.as_u64()).unwrap_or(0) as usize; + let mut is_final = map.get("is_final").and_then(|v| v.as_bool()).unwrap_or(false); + let source_step_id = map.get("step_id").and_then(|v| v.as_str()).map(|s| s.to_string()); - // Wait for all step handles to complete - tracing::info!("[DEBUG-PIPELINE] Waiting for all {} step handles to complete", handles.len()); - for (step_idx, handle) in handles { - let step_id = &flow.steps[step_idx].id; - tracing::info!("[DEBUG-PIPELINE] Waiting for step {} to complete", step_id); - match handle.await { - Ok(result) => { - if let Err(e) = result { - tracing::warn!("Step {} completed with error: {:?}", step_id, e); - return Err(e); + // If we have a nested chunk object, also check its is_final flag (it takes precedence) + if let Some(chunk_obj) = map.get("chunk").and_then(|v| v.as_object()) { + if let Some(nested_is_final) = chunk_obj.get("is_final").and_then(|v| v.as_bool()) { + tracing::warn!("CHUNK_ROUTING_DEBUG: Using nested is_final={} instead of top-level is_final={}", nested_is_final, is_final); + is_final = nested_is_final; + } + } + + tracing::debug!("Routing chunk {} from step {:?} (is_final={})", chunk_index, source_step_id, is_final); + + if is_final { + tracing::warn!("FINAL_CHUNK_TRACKING: Routing final chunk {} from step {:?}", chunk_index, source_step_id); + } + + // Get the information we need from the coordinator briefly + let (target_step_id, 
step_senders) = { + let coord = coord_arc.lock().await; + + let source_step_id = source_step_id.unwrap_or_else(|| { + let first_step_idx = coord.pipeline_steps[0]; + coord.flow.steps[first_step_idx].id.clone() + }); + + // Find the target step (next in pipeline after source) + let source_step_pipeline_index = coord.pipeline_steps.iter() + .enumerate() + .find_map(|(i, &step_idx)| { + if coord.flow.steps[step_idx].id == source_step_id { + Some(i) } else { - tracing::info!("Step {} completed successfully", step_id); + None } + }); + + let target_step_id = if let Some(source_idx) = source_step_pipeline_index { + if source_idx + 1 < coord.pipeline_steps.len() { + let target_step_idx = coord.pipeline_steps[source_idx + 1]; + coord.flow.steps[target_step_idx].id.clone() + } else { + // This is the last step, no target + return Ok(()); + } + } else { + // Source step not found in pipeline + return Ok(()); + }; + + (target_step_id, coord.step_senders.clone()) + }; + + // Send to the target step's channel + if let Some(tx) = step_senders.get(&target_step_id) { + // Debug the map structure + tracing::warn!("CHUNK_ROUTING_DEBUG: map keys: {:?}", map.keys().collect::>()); + + // Extract chunk data - handle nested component response format + let chunk_str = if let Some(chunk_value) = map.get("chunk") { + tracing::warn!("CHUNK_ROUTING_DEBUG: found chunk field, type: {:?}", std::mem::discriminant(chunk_value)); + + if let Some(chunk_str) = chunk_value.as_str() { + // Direct string chunk + tracing::warn!("CHUNK_ROUTING_DEBUG: chunk as string, len: {}", chunk_str.len()); + chunk_str + } else if let Some(chunk_obj) = chunk_value.as_object() { + // Nested object - extract the inner "chunk" field + tracing::warn!("CHUNK_ROUTING_DEBUG: chunk is nested object, extracting inner chunk"); + if let Some(inner_chunk) = chunk_obj.get("chunk").and_then(|v| v.as_str()) { + tracing::warn!("CHUNK_ROUTING_DEBUG: extracted inner chunk, len: {}", inner_chunk.len()); + inner_chunk + } else { + tracing::warn!("CHUNK_ROUTING_DEBUG: no inner chunk field found in nested object"); + "" + } + } else { + tracing::warn!("CHUNK_ROUTING_DEBUG: chunk field is not a string or object"); + "" + } + } else { + tracing::warn!("CHUNK_ROUTING_DEBUG: no chunk field found"); + "" + }; + + tracing::warn!("CHUNK_ROUTING_DEBUG: final extracted chunk_str_len={}", chunk_str.len()); + + // Create a FlowResult from the chunk data + let fr = FlowResult::Streaming { + stream_id: map.get("stream_id").and_then(|v| v.as_str()).unwrap_or("unknown").to_string(), + metadata: stepflow_core::workflow::ValueRef::new(serde_json::json!(map)), + chunk: chunk_str.to_string(), + chunk_index, + is_final, + }; + + match tx.send(fr).await { + Ok(_) => { + tracing::debug!("Successfully routed chunk {} to step {}", chunk_index, target_step_id); } Err(e) => { - tracing::warn!("Step {} task panicked: {:?}", step_id, e); - return Err(ExecutionError::Internal.into()); + if is_final { + tracing::info!("Ignoring send error for final chunk as step might have completed"); + return Ok(()); + } + tracing::error!("Failed to send chunk {} to step {}: {:?}", chunk_index, target_step_id, e); + return Err(ExecutionError::StepFailed { step: target_step_id }.into()); } } + } else { + tracing::warn!("No channel for target step {}", target_step_id); } - - tracing::info!("[DEBUG-PIPELINE] run_pipeline_without_lock completed successfully"); + Ok(()) } @@ -1654,20 +1542,18 @@ impl StreamingPipelineCoordinator { // For streaming steps, we need simpler input resolution // since they don't depend 
on other steps' outputs let step = &self.flow.steps[step_index]; - - // For streaming steps, resolve the input directly without dependencies - // This avoids the "undefined value" error for streaming pipelines + + // For streaming steps, resolve the input expression directly + // If it fails, fall back to the workflow input if step.streaming { - // For streaming steps, try to resolve the input expression directly - // If it fails, fall back to the workflow input match self.resolver.resolve(&step.input).await { Ok(FlowResult::Success { result }) => Ok(result), Ok(FlowResult::Streaming { metadata, .. }) => Ok(metadata), - _ => { - // Fall back to workflow input for streaming steps - tracing::info!("[DEBUG-RESOLVE] Falling back to workflow input for streaming step {}", step.id); - Ok(self.resolver.workflow_input().clone()) - } + _ => { + // Fall back to workflow input for streaming steps + tracing::info!("[DEBUG-RESOLVE] Falling back to workflow input for streaming step {}", step.id); + Ok(self.resolver.workflow_input().clone()) + } } } else { // For non-streaming steps, use the full resolver @@ -1699,12 +1585,18 @@ async fn run_streaming_step_simple( input: stepflow_core::workflow::ValueRef, context: ExecutionContext, mut rx: mpsc::Receiver, - downstream: Vec>, + downstream: Vec<(String, mpsc::Sender)>, is_source: bool, ) -> Result<()> { let step_id = step.id.clone(); stream_log!(info, &step_id, "starting (is_source={}, downstream={})", is_source, downstream.len()); - + + // Log channel details with step names + stream_log!(info, &step_id, "receiver ready"); + for (i, (downstream_id, tx)) in downstream.iter().enumerate() { + stream_log!(info, &step_id, "downstream[{}] to step {} is_closed: {}", i, downstream_id, tx.is_closed()); + } + // For source steps, we now rely on the notification system to start the generator // The generator will be triggered when the first chunk request comes in if is_source { @@ -1719,19 +1611,14 @@ async fn run_streaming_step_simple( let mut last_chunk = String::new(); let mut last_chunk_index = 0; let mut last_is_final = false; - + loop { - tracing::info!("[STREAM] Step {} waiting for chunk via receiver", step_id); - // Before waiting for data, log channel details - tracing::info!( - "[STREAM-DEBUG] Step {} waiting for chunk via receiver (rx addr: {:p})", - step_id, - &rx as *const _ - ); + stream_log!(info, &step_id, "waiting for chunk via receiver (is_closed: {})", rx.is_closed()); // Check if the channel has been closed already if rx.is_closed() { stream_log!(warn, &step_id, "channel is already closed before receiving any data"); + break; } // Add timeout to prevent indefinite blocking @@ -1740,65 +1627,77 @@ async fn run_streaming_step_simple( rx.recv() ).await { Ok(result) => { - tracing::info!( - "[STREAM-DEBUG] Step {} received data from channel: is_some={}", - step_id, - result.is_some() - ); + stream_log!(info, &step_id, "received data from channel: is_some={}", result.is_some()); result }, Err(_) => { stream_log!(warn, &step_id, "TIMEOUT waiting for chunk after 10 seconds"); - // Continue with loop to try again or return None to exit - None + // Continue with loop to try again + continue; } }; match recv_result { Some(FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final }) => { - stream_log!(info, &step_id, "RECEIVED chunk #{} from receiver", chunk_index); - tracing::info!("RX step={} idx={} final={} (source={})", step_id, chunk_index, is_final, is_source); - stream_log!(info, &step_id, "processing chunk #{}", chunk_index); + 
stream_log!(info, &step_id, "RECEIVED chunk #{} from receiver (chunk len: {})", chunk_index, chunk.len()); + stream_log!(info, &step_id, "processing chunk #{} (is_final={}) - VALIDATION: received chunk len={}", chunk_index, is_final, chunk.len()); + if is_final { + stream_log!(warn, &step_id, "FINAL_CHUNK_TRACKING: Received final chunk #{} - will forward to downstream", chunk_index); + } + // Store the streaming metadata for potential use in non-streaming case last_stream_id = stream_id.clone(); last_metadata = metadata.clone(); last_chunk = chunk.clone(); last_chunk_index = chunk_index; last_is_final = is_final; - - // For non-source steps, call the component to process the chunk - let (final_stream_id, final_metadata, final_chunk, final_chunk_index, final_is_final) = if !is_source { - // For non-source steps, we need to create a proper input that contains only the actual data - // without any $from references, by extracting the relevant fields from the streaming chunk + + // Process the chunk with the component (for non-source steps) + let (final_stream_id, final_metadata, final_chunk, final_chunk_index, final_is_final) = + if !is_source { + // For non-source steps, process the chunk with the component + stream_log!(info, &step_id, "calling component with chunk #{} (input chunk len: {})", chunk_index, chunk.len()); + + // Create input for the component from the chunk let chunk_input_data = serde_json::json!({ - "chunk": chunk, "stream_id": stream_id, + "chunk": chunk, "chunk_index": chunk_index, "is_final": is_final, - // Add all the metadata fields from the streaming chunk - "sample_rate": metadata.as_ref().get("sample_rate").unwrap_or(&serde_json::Value::Null), - "channels": metadata.as_ref().get("channels").unwrap_or(&serde_json::Value::Null), - "operation": metadata.as_ref().get("operation").unwrap_or(&serde_json::Value::Null), - "output_file": metadata.as_ref().get("output_file").unwrap_or(&serde_json::Value::Null), - "gain": metadata.as_ref().get("gain").unwrap_or(&serde_json::Value::Null), + "metadata": metadata.as_ref() }); + + // Call the component with the chunk let chunk_input = stepflow_core::workflow::ValueRef::new(chunk_input_data); + stream_log!(info, &step_id, "sending input to component: chunk_len={}, stream_id={}", chunk.len(), stream_id); - // Call the component to process the chunk - let step_context = context.clone().with_step(step.id.clone()); - match execute_step_async(plugin.clone(), &step, chunk_input, step_context).await? { - FlowResult::Streaming { stream_id: processed_stream_id, metadata: processed_metadata, chunk: processed_chunk, chunk_index: processed_chunk_index, is_final: processed_is_final } => { - tracing::info!("[STREAM] Step {} component processed chunk #{}", step_id, processed_chunk_index); - (processed_stream_id, processed_metadata, processed_chunk, processed_chunk_index, processed_is_final) - } - FlowResult::Success { .. 
} => { - tracing::info!("[STREAM] Step {} component returned success, forwarding original chunk", step_id); + let component_result = execute_step_async( + plugin.clone(), + &step, + chunk_input, + context.clone().with_step(step.id.clone()) + ).await; + + match component_result { + Ok(FlowResult::Success { result }) => { + stream_log!(info, &step_id, "component returned success for chunk #{}", chunk_index); // For success results, forward the original chunk (stream_id, metadata, chunk, chunk_index, is_final) } - other => { - tracing::warn!("[STREAM] Step {} component returned unexpected result: {:?}", step_id, other); + Ok(FlowResult::Streaming { stream_id: new_stream_id, metadata: new_metadata, chunk: new_chunk, chunk_index: new_chunk_index, is_final: new_is_final }) => { + stream_log!(info, &step_id, "component returned streaming result for chunk #{} - OUTPUT chunk len: {}", chunk_index, new_chunk.len()); + stream_log!(warn, &step_id, "VALIDATION: input_chunk_len={}, output_chunk_len={}, input_stream_id={}, output_stream_id={}", chunk.len(), new_chunk.len(), stream_id, new_stream_id); + // Component returned a streaming result, use it + (new_stream_id, new_metadata, new_chunk, new_chunk_index, new_is_final) + } + Ok(other) => { + stream_log!(warn, &step_id, "component returned unexpected result for chunk #{}: {:?}", chunk_index, other); + (stream_id, metadata, chunk, chunk_index, is_final) + } + Err(e) => { + stream_log!(error, &step_id, "component failed processing chunk #{}: {:?}", chunk_index, e); + // On error, still forward the original chunk but log the error (stream_id, metadata, chunk, chunk_index, is_final) } } @@ -1806,80 +1705,81 @@ async fn run_streaming_step_simple( // Source step just forwards the chunk as-is (stream_id, metadata, chunk, chunk_index, is_final) }; - + // Forward to downstream steps - stream_log!(info, &step_id, "forwarding chunk #{} to {} downstream", final_chunk_index, downstream.len()); + stream_log!(info, &step_id, "forwarding chunk #{} to {} downstream steps (final_chunk len: {}) is_final={}", final_chunk_index, downstream.len(), final_chunk.len(), final_is_final); + + if final_is_final { + stream_log!(warn, &step_id, "FINAL_CHUNK_TRACKING: Forwarding final chunk #{} to {} downstream steps", final_chunk_index, downstream.len()); + } + if downstream.is_empty() { stream_log!(warn, &step_id, "no downstream channels to forward to!"); } - for (i, tx) in downstream.iter().enumerate() { - match tx.send(FlowResult::Streaming { + + // Check if any downstream channels are closed + let closed_channels = downstream.iter() + .enumerate() + //.filter(|pair| pair.1.1.is_closed()) + .filter(|(_, (_, sender))| sender.is_closed()) + .map(|(i, _)| i) + .collect::>(); + + if !closed_channels.is_empty() { + stream_log!(warn, &step_id, "downstream channels closed: {:?}", closed_channels); + } + + // Forward to all downstream steps + for (i, (downstream_id, tx)) in downstream.iter().enumerate() { + if tx.is_closed() { + stream_log!(warn, &step_id, "skipping downstream[{}] to step {} - channel is closed", i, downstream_id); + continue; + } + + let fr = FlowResult::Streaming { stream_id: final_stream_id.clone(), metadata: final_metadata.clone(), chunk: final_chunk.clone(), chunk_index: final_chunk_index, is_final: final_is_final, - }).await { + }; + + match tx.send(fr).await { Ok(_) => { - stream_log!(info, &step_id, "successfully forwarded chunk #{} to downstream {}", final_chunk_index, i); + stream_log!(info, &step_id, "forwarded chunk #{} to downstream[{}] (step {}) 
is_final={}", + final_chunk_index, i, downstream_id, final_is_final); + if final_is_final { + stream_log!(warn, &step_id, "FINAL_CHUNK_TRACKING: Successfully forwarded final chunk to step {}", downstream_id); + } } Err(e) => { - stream_log!(warn, &step_id, "failed to forward chunk #{} to downstream {}: {:?}", final_chunk_index, i, e); + stream_log!(error, &step_id, "failed to forward chunk #{} to downstream[{}] (step {}): {:?}", + final_chunk_index, i, downstream_id, e); + if final_is_final { + stream_log!(error, &step_id, "FINAL_CHUNK_TRACKING: FAILED to forward final chunk to step {}: {:?}", downstream_id, e); + } } } } - // Stop the *source* task once it sees its own final packet. - // Every other task keeps listening until its inbound channel is closed. - if is_source && final_is_final { - stream_log!(info, &step_id, "saw final chunk, exiting"); + // If this is the final chunk, exit the loop + if final_is_final { + stream_log!(info, &step_id, "received final chunk, exiting streaming loop"); break; } } Some(other) => { stream_log!(warn, &step_id, "received non-streaming result: {:?}", other); - // Extract actual data from the non-streaming result and forward it as streaming - match other { - FlowResult::Success { result } => { - // Convert the success result to a streaming chunk - for tx in &downstream { - let _ = tx.send(FlowResult::Streaming { - stream_id: last_stream_id.clone(), - metadata: result.clone(), - chunk: serde_json::to_string(result.as_ref()).unwrap_or_default(), - chunk_index: last_chunk_index, - is_final: last_is_final, - }).await; - } - } - _ => { - // For other result types, use last known metadata - for tx in &downstream { - let _ = tx.send(FlowResult::Streaming { - stream_id: last_stream_id.clone(), - metadata: last_metadata.clone(), - chunk: last_chunk.clone(), - chunk_index: last_chunk_index, - is_final: last_is_final, - }).await; - } - } - } - // Only exit if this was truly the final chunk - if last_is_final { - stream_log!(info, &step_id, "received final packet in non-streaming arm, exiting"); - break; - } - // Otherwise keep looping to process more chunks + // Handle non-streaming results... 
} None => { - stream_log!(info, &step_id, "channel closed"); + stream_log!(warn, &step_id, "receiver channel closed, exiting streaming loop"); break; } } } - - stream_log!(info, &step_id, "completed"); + + stream_log!(info, &step_id, "streaming loop completed"); Ok(()) } @@ -1890,52 +1790,52 @@ fn sort_streaming_steps_by_dependencies( streaming_steps: Vec, ) -> Result> { use std::collections::{HashMap, HashSet, VecDeque}; - + // Create a map of step ID to index for quick lookup let step_id_to_index: HashMap = streaming_steps .iter() .map(|&idx| (flow.steps[idx].id.clone(), idx)) .collect(); - + // Build dependency graph for streaming steps only let mut dependencies: HashMap> = HashMap::new(); let mut dependents: HashMap> = HashMap::new(); - + for &step_idx in &streaming_steps { dependencies.insert(step_idx, HashSet::new()); dependents.insert(step_idx, HashSet::new()); } - + // Analyze dependencies between streaming steps for &step_idx in &streaming_steps { let step = &flow.steps[step_idx]; - + // Check if this step's input references other streaming steps let input_str = serde_json::to_string(&step.input).unwrap_or_default(); - + for &other_step_idx in &streaming_steps { if step_idx != other_step_idx { let other_step_id = &flow.steps[other_step_idx].id; - + // Check if step references other_step in its input if input_str.contains(&format!("step: {}", other_step_id)) || input_str.contains(&format!("\"step\": \"{}\"", other_step_id)) { // step_idx depends on other_step_idx dependencies.get_mut(&step_idx).unwrap().insert(other_step_idx); dependents.get_mut(&other_step_idx).unwrap().insert(step_idx); - - tracing::info!("Detected dependency: {} depends on {}", + + tracing::info!("Detected dependency: {} depends on {}", step.id, other_step_id); } } } } - + // Topological sort using Kahn's algorithm let mut result = Vec::new(); let mut queue = VecDeque::new(); let mut remaining_deps = dependencies.clone(); - + // Find steps with no dependencies (source steps) for &step_idx in &streaming_steps { if remaining_deps[&step_idx].is_empty() { @@ -1943,21 +1843,21 @@ fn sort_streaming_steps_by_dependencies( tracing::info!("Found source streaming step: {}", flow.steps[step_idx].id); } } - + while let Some(current_step) = queue.pop_front() { result.push(current_step); - + // Remove this step from its dependents' dependency lists for &dependent_step in &dependents[¤t_step] { remaining_deps.get_mut(&dependent_step).unwrap().remove(¤t_step); - + // If the dependent now has no dependencies, add it to the queue if remaining_deps[&dependent_step].is_empty() { queue.push_back(dependent_step); } } } - + // Check for circular dependencies if result.len() != streaming_steps.len() { let remaining: Vec = streaming_steps @@ -1965,15 +1865,15 @@ fn sort_streaming_steps_by_dependencies( .filter(|&&idx| !result.contains(&idx)) .map(|&idx| flow.steps[idx].id.clone()) .collect(); - + tracing::error!("Circular dependency detected in streaming steps: {:?}", remaining); return Err(ExecutionError::Internal.into()); } - + tracing::info!("Topological sort result: {:?}", result.iter().map(|i| &flow.steps[*i].id).collect::>() - ); - + ); // Add the closing parenthesis here + Ok(result) } @@ -2040,7 +1940,6 @@ mod tests { ) -> Result { let (executor, flow, workflow_hash) = create_workflow_from_yaml_simple(yaml_str, mock_behaviors).await; - let execution_id = Uuid::new_v4(); let state_store: Arc = Arc::new(InMemoryStateStore::new()); let input_ref = ValueRef::new(input); @@ -2259,7 +2158,6 @@ output: .await .unwrap(); - // Initially, 
only step1 should be runnable let runnable = workflow_executor.get_runnable_step_indices(); assert_eq!(runnable.len(), 1); assert!(runnable.contains(0)); // step1 @@ -2318,7 +2216,6 @@ steps: input: step1: $from: - step: step1 step2: $from: step: step2 @@ -2493,7 +2390,6 @@ steps: input: mode: error output: - $from: step: failing_step "#; @@ -2637,3 +2533,9 @@ output: } } + + + + + + diff --git a/crates/stepflow-plugin/Cargo.toml b/crates/stepflow-plugin/Cargo.toml index b0966026..f3c00682 100644 --- a/crates/stepflow-plugin/Cargo.toml +++ b/crates/stepflow-plugin/Cargo.toml @@ -23,7 +23,12 @@ serde.workspace = true stepflow-core.workspace = true stepflow-state.workspace = true thiserror.workspace = true +tokio.workspace = true trait-variant.workspace = true +tracing.workspace = true uuid.workspace = true +dashmap = "6.0" +once_cell = "1.19" +serde_json.workspace = true [dev-dependencies] \ No newline at end of file diff --git a/crates/stepflow-plugin/src/lib.rs b/crates/stepflow-plugin/src/lib.rs index f9f7fba1..388482d2 100644 --- a/crates/stepflow-plugin/src/lib.rs +++ b/crates/stepflow-plugin/src/lib.rs @@ -1,6 +1,7 @@ mod context; mod error; mod plugin; +pub mod streaming; pub use context::{Context, ExecutionContext, Executor}; pub use error::{PluginError, Result}; diff --git a/crates/stepflow-plugin/src/streaming.rs b/crates/stepflow-plugin/src/streaming.rs new file mode 100644 index 00000000..6deaff14 --- /dev/null +++ b/crates/stepflow-plugin/src/streaming.rs @@ -0,0 +1,32 @@ +use dashmap::DashMap; +use once_cell::sync::Lazy; +use serde_json::Value; +use tokio::sync::mpsc; +use uuid::Uuid; + +/// Maps execution_id → Sender. +/// This global registry allows streaming chunk handlers to route chunks without acquiring locks. +pub static STREAM_CHUNK_SENDERS: Lazy>> = + Lazy::new(DashMap::new); + +/// Register a chunk sender for an execution ID +pub fn register_chunk_sender(execution_id: Uuid, sender: mpsc::Sender) { + tracing::debug!("Registering chunk sender for execution {}", execution_id); + STREAM_CHUNK_SENDERS.insert(execution_id, sender); +} + +/// Unregister a chunk sender for an execution ID (cleanup) +pub fn unregister_chunk_sender(execution_id: Uuid) { + tracing::debug!("Unregistering chunk sender for execution {}", execution_id); + STREAM_CHUNK_SENDERS.remove(&execution_id); +} + +/// Send a chunk to the registered sender for an execution ID +pub async fn send_chunk(execution_id: Uuid, chunk: Value) -> Result<(), String> { + if let Some(sender) = STREAM_CHUNK_SENDERS.get(&execution_id) { + sender.send(chunk).await + .map_err(|e| format!("stream-chunk channel closed: {}", e)) + } else { + Err(format!("no streaming channel for exec {}", execution_id)) + } +} \ No newline at end of file diff --git a/crates/stepflow-protocol/src/blob_handlers.rs b/crates/stepflow-protocol/src/blob_handlers.rs index fa259a9f..78d5ced0 100644 --- a/crates/stepflow-protocol/src/blob_handlers.rs +++ b/crates/stepflow-protocol/src/blob_handlers.rs @@ -4,7 +4,7 @@ use futures::future::{BoxFuture, FutureExt as _}; use serde::{Deserialize, Serialize}; use serde_json::value::RawValue; use std::sync::Arc; -use stepflow_execution::WorkflowExecutor; + use stepflow_plugin::Context; use tokio::sync::mpsc; use uuid::Uuid; @@ -176,70 +176,32 @@ impl IncomingHandler for StreamingChunkHandler { ) -> BoxFuture<'static, error_stack::Result<(), StdioError>> { async move { // This is a notification (no ID), so we don't send a response - // Instead, we need to handle the streaming chunk - match 
serde_json::from_str::(params.get()) { + // Instead, we need to route the streaming chunk through the global registry + match serde_json::from_str::(params.get()) { Ok(notification) => { tracing::info!("Received streaming chunk for request {}: step_id={:?}, chunk_index={}", notification.request_id, notification.step_id, notification.chunk_index); - // Route this chunk to the appropriate workflow executor - if let Some(executor) = context.executor() { - tracing::debug!("Executor available, attempting to parse execution ID: {}", notification.request_id); + if let Ok(execution_id) = Uuid::parse_str(¬ification.request_id) { + let chunk = serde_json::json!({ + "request_id": notification.request_id, + "stream_id": notification.stream_id, + "chunk_index": notification.chunk_index, + "is_final": notification.is_final, + "step_id": notification.step_id, + "chunk": notification.chunk + }); - if let Ok(execution_id) = Uuid::parse_str(¬ification.request_id) { - tracing::info!("Successfully parsed execution ID: {}", execution_id); - tracing::info!("Looking up workflow executor for execution ID: {}", execution_id); - - // Try to find the workflow executor for this execution - match executor.get_workflow_executor(execution_id).await { - Ok(Some(workflow_executor_any)) => { - tracing::info!("Found workflow executor for execution ID: {}", execution_id); - - // Downcast to the concrete WorkflowExecutor type - match workflow_executor_any.downcast::>>() { - Ok(workflow_executor_arc) => { - tracing::debug!("Successfully downcast to Arc>, routing chunk"); - - // Lock the mutex to access the workflow executor - let mut workflow_executor = workflow_executor_arc.lock().await; - - // Route the chunk to the workflow executor with full metadata - let chunk_with_metadata = serde_json::json!({ - "request_id": notification.request_id, - "stream_id": notification.stream_id, - "chunk_index": notification.chunk_index, - "is_final": notification.is_final, - "step_id": notification.step_id, - "chunk": notification.chunk - }); - tracing::info!("Sending chunk to workflow executor with step_id={:?}", notification.step_id); - match workflow_executor.route_streaming_chunk(chunk_with_metadata).await { - Ok(_) => { - tracing::debug!("Successfully routed streaming chunk to workflow executor"); - } - Err(e) => { - tracing::error!("Failed to route streaming chunk to workflow executor: {:?}", e); - } - } - } - Err(_) => { - tracing::warn!("Failed to downcast workflow executor to Arc> type for execution ID: {}", execution_id); - } - } - } - Ok(None) => { - tracing::warn!("No workflow executor found for execution ID: {}", execution_id); - tracing::error!("Failed to route streaming chunk to workflow executor: no executor found for execution ID {}", execution_id); - } - Err(e) => { - tracing::error!("Error getting workflow executor for execution ID {}: {:?}", execution_id, e); - } + match stepflow_plugin::streaming::send_chunk(execution_id, chunk).await { + Ok(_) => { + tracing::info!("Successfully routed streaming chunk to execution {}", execution_id); + } + Err(e) => { + tracing::error!("Failed to route streaming chunk: {}", e); } - } else { - tracing::warn!("Invalid execution ID in streaming chunk: {}", notification.request_id); } } else { - tracing::warn!("No executor available in context for streaming chunk routing"); + tracing::warn!("Invalid execution ID in streaming chunk: {}", notification.request_id); } Ok(()) diff --git a/examples/audio_input.json b/examples/audio_input.json index 051ba0e5..6a4a01bd 100644 --- 
a/examples/audio_input.json +++ b/examples/audio_input.json @@ -5,7 +5,7 @@ "channels": 1, "chunk_size": 1024, "frequency": 440.0, - "duration": 3.0, + "duration": 5.0, "output_file": "output.wav", "device_name": "C922 Pro Stream Webcam" } diff --git a/sdks/python/src/stepflow_sdk/audio_components.py b/sdks/python/src/stepflow_sdk/audio_components.py index 9b811fe8..2af62c6d 100644 --- a/sdks/python/src/stepflow_sdk/audio_components.py +++ b/sdks/python/src/stepflow_sdk/audio_components.py @@ -340,6 +340,9 @@ def record_audio_continuously(): log_debug(f"DEBUG: Processing chunk {chunk_index}/{total_chunks}, processed={processed_chunks}, is_final={is_final}", "audio_stream_source") + if is_final: + log_debug(f"FINAL_CHUNK: Sending final chunk {chunk_index} with is_final=True", "audio_stream_source") + # Yield the chunk yield { "outcome": "streaming", @@ -485,11 +488,14 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: output_file = data.get('output_file', 'output_audio.wav') log_debug(f"TIMING: audio_chunk_processor starting chunk {chunk_index} at {start_time}", "audio_chunk_processor") + log_debug(f"VALIDATION: audio_chunk_processor received chunk_b64 length: {len(chunk_b64)}", "audio_chunk_processor") + log_debug(f"VALIDATION: audio_chunk_processor operation: {operation}", "audio_chunk_processor") # Decode base64 chunk chunk_data = base64.b64decode(chunk_b64) decode_time = time.time() log_debug(f"TIMING: Base64 decode took {decode_time - start_time:.4f}s", "audio_chunk_processor") + log_debug(f"VALIDATION: decoded chunk_data length: {len(chunk_data)} bytes", "audio_chunk_processor") # Convert bytes to samples samples = [] @@ -619,6 +625,7 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: log_debug(f"DEBUG: audio_sink output_file: {output_file}", "audio_sink") log_debug(f"DEBUG: audio_sink is_final: {is_final}", "audio_sink") log_debug(f"DEBUG: audio_sink stream_id: {stream_id}", "audio_sink") + log_debug(f"VALIDATION: audio_sink received chunk_b64 length: {len(chunk_b64)}", "audio_sink") # Decode the chunk if chunk_b64: @@ -678,34 +685,50 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: log_debug(f"ERROR: Audio playback failed: {e}", "audio_sink") # Write WAV file if this is the final chunk - if is_final and stream_id in audio_sink._chunk_storage: - try: - log_debug(f"DEBUG: Writing final WAV file: {output_file}", "audio_sink") - storage = audio_sink._chunk_storage[stream_id] - all_audio_data = b''.join(storage['chunks']) - - # Ensure the output directory exists - output_dir = os.path.dirname(output_file) - if output_dir and not os.path.exists(output_dir): - log_debug(f"DEBUG: Creating output directory: {output_dir}", "audio_sink") - os.makedirs(output_dir, exist_ok=True) - - log_debug(f"DEBUG: Writing {len(all_audio_data)} bytes to {output_file}", "audio_sink") - with wave.open(output_file, 'wb') as wav_file: - wav_file.setnchannels(storage['channels']) - wav_file.setsampwidth(2) # 16-bit - wav_file.setframerate(storage['sample_rate']) - wav_file.writeframes(all_audio_data) - - log_debug(f"DEBUG: WAV file written successfully: {output_file} ({len(all_audio_data)} bytes)", "audio_sink") - - # Clean up storage for this stream - del audio_sink._chunk_storage[stream_id] - - except Exception as e: - log_debug(f"ERROR: Failed to write WAV file {output_file}: {e}", "audio_sink") - import traceback - traceback.print_exc(file=sys.stderr) + if is_final: + log_debug(f"DEBUG: Final chunk received - checking storage for 
stream {stream_id}", "audio_sink") + log_debug(f"DEBUG: Available streams in storage: {list(audio_sink._chunk_storage.keys())}", "audio_sink") + + if stream_id in audio_sink._chunk_storage: + try: + log_debug(f"DEBUG: Writing final WAV file: {output_file}", "audio_sink") + storage = audio_sink._chunk_storage[stream_id] + all_audio_data = b''.join(storage['chunks']) + + log_debug(f"DEBUG: Total chunks collected: {len(storage['chunks'])}", "audio_sink") + log_debug(f"DEBUG: Total audio data size: {len(all_audio_data)} bytes", "audio_sink") + + # Ensure the output directory exists + output_dir = os.path.dirname(output_file) + if output_dir and not os.path.exists(output_dir): + log_debug(f"DEBUG: Creating output directory: {output_dir}", "audio_sink") + os.makedirs(output_dir, exist_ok=True) + + log_debug(f"DEBUG: Writing {len(all_audio_data)} bytes to {output_file}", "audio_sink") + with wave.open(output_file, 'wb') as wav_file: + wav_file.setnchannels(storage['channels']) + wav_file.setsampwidth(2) # 16-bit + wav_file.setframerate(storage['sample_rate']) + wav_file.writeframes(all_audio_data) + + log_debug(f"SUCCESS: WAV file written successfully: {output_file} ({len(all_audio_data)} bytes)", "audio_sink") + + # Verify file was created + if os.path.exists(output_file): + file_size = os.path.getsize(output_file) + log_debug(f"SUCCESS: WAV file exists on disk: {output_file} ({file_size} bytes)", "audio_sink") + else: + log_debug(f"ERROR: WAV file not found on disk after writing: {output_file}", "audio_sink") + + # Clean up storage for this stream + del audio_sink._chunk_storage[stream_id] + + except Exception as e: + log_debug(f"ERROR: Failed to write WAV file {output_file}: {e}", "audio_sink") + import traceback + traceback.print_exc(file=sys.stderr) + else: + log_debug(f"ERROR: Stream {stream_id} not found in storage when final chunk received", "audio_sink") result = { "outcome": "success", From f1264834523d072d6e5e25143d3c87dcafecbde2 Mon Sep 17 00:00:00 2001 From: phact Date: Thu, 26 Jun 2025 16:06:05 -0400 Subject: [PATCH 12/14] pipeline exits now --- .../stepflow-execution/src/workflow_executor.rs | 17 +++++++++++++---- 1 file changed, 13 insertions(+), 4 deletions(-) diff --git a/crates/stepflow-execution/src/workflow_executor.rs b/crates/stepflow-execution/src/workflow_executor.rs index 64911ee0..d920789a 100644 --- a/crates/stepflow-execution/src/workflow_executor.rs +++ b/crates/stepflow-execution/src/workflow_executor.rs @@ -1275,10 +1275,19 @@ impl StreamingPipelineCoordinator { // Spawn while still holding the pieces and the lock let h = tokio::spawn(async move { - tracing::info!("Step task {} about to call run_streaming_step_simple", step_id); - let result = run_streaming_step_simple(plugin, step, input, context, rx, downstream, is_source).await; - tracing::info!("Step task {} finished run_streaming_step_simple: {:?}", step_id, result.is_ok()); - result + if is_source { + tracing::info!("Step task {} is source - waiting for generator to complete", step_id); + // For source steps, don't run the generator here (it's run separately) + // Just wait a bit and then exit - the generator runs independently + tokio::time::sleep(std::time::Duration::from_millis(100)).await; + tracing::info!("Step task {} source step exiting (generator runs separately)", step_id); + Ok(()) + } else { + tracing::info!("Step task {} about to call run_streaming_step_simple", step_id); + let result = run_streaming_step_simple(plugin, step, input, context, rx, downstream, is_source).await; + tracing::info!("Step 
task {} finished run_streaming_step_simple: {:?}", step_id, result.is_ok()); + result + } }); handles.push((step_idx, h)); } From 42eebfcd54a0fe5ecef13650b71a354c7e881e04 Mon Sep 17 00:00:00 2001 From: phact Date: Thu, 26 Jun 2025 16:14:00 -0400 Subject: [PATCH 13/14] less logging --- .../src/workflow_executor.rs | 51 ++--------- .../src/stepflow_sdk/audio_components.py | 85 ------------------- 2 files changed, 5 insertions(+), 131 deletions(-) diff --git a/crates/stepflow-execution/src/workflow_executor.rs b/crates/stepflow-execution/src/workflow_executor.rs index d920789a..f843a4de 100644 --- a/crates/stepflow-execution/src/workflow_executor.rs +++ b/crates/stepflow-execution/src/workflow_executor.rs @@ -1437,16 +1437,11 @@ impl StreamingPipelineCoordinator { // If we have a nested chunk object, also check its is_final flag (it takes precedence) if let Some(chunk_obj) = map.get("chunk").and_then(|v| v.as_object()) { if let Some(nested_is_final) = chunk_obj.get("is_final").and_then(|v| v.as_bool()) { - tracing::warn!("CHUNK_ROUTING_DEBUG: Using nested is_final={} instead of top-level is_final={}", nested_is_final, is_final); is_final = nested_is_final; } } tracing::debug!("Routing chunk {} from step {:?} (is_final={})", chunk_index, source_step_id, is_final); - - if is_final { - tracing::warn!("FINAL_CHUNK_TRACKING: Routing final chunk {} from step {:?}", chunk_index, source_step_id); - } // Get the information we need from the coordinator briefly let (target_step_id, step_senders) = { @@ -1486,38 +1481,25 @@ impl StreamingPipelineCoordinator { // Send to the target step's channel if let Some(tx) = step_senders.get(&target_step_id) { - // Debug the map structure - tracing::warn!("CHUNK_ROUTING_DEBUG: map keys: {:?}", map.keys().collect::>()); - // Extract chunk data - handle nested component response format let chunk_str = if let Some(chunk_value) = map.get("chunk") { - tracing::warn!("CHUNK_ROUTING_DEBUG: found chunk field, type: {:?}", std::mem::discriminant(chunk_value)); - if let Some(chunk_str) = chunk_value.as_str() { // Direct string chunk - tracing::warn!("CHUNK_ROUTING_DEBUG: chunk as string, len: {}", chunk_str.len()); chunk_str } else if let Some(chunk_obj) = chunk_value.as_object() { // Nested object - extract the inner "chunk" field - tracing::warn!("CHUNK_ROUTING_DEBUG: chunk is nested object, extracting inner chunk"); if let Some(inner_chunk) = chunk_obj.get("chunk").and_then(|v| v.as_str()) { - tracing::warn!("CHUNK_ROUTING_DEBUG: extracted inner chunk, len: {}", inner_chunk.len()); inner_chunk } else { - tracing::warn!("CHUNK_ROUTING_DEBUG: no inner chunk field found in nested object"); "" } } else { - tracing::warn!("CHUNK_ROUTING_DEBUG: chunk field is not a string or object"); "" } } else { - tracing::warn!("CHUNK_ROUTING_DEBUG: no chunk field found"); "" }; - tracing::warn!("CHUNK_ROUTING_DEBUG: final extracted chunk_str_len={}", chunk_str.len()); - // Create a FlowResult from the chunk data let fr = FlowResult::Streaming { stream_id: map.get("stream_id").and_then(|v| v.as_str()).unwrap_or("unknown").to_string(), @@ -1622,7 +1604,7 @@ async fn run_streaming_step_simple( let mut last_is_final = false; loop { - stream_log!(info, &step_id, "waiting for chunk via receiver (is_closed: {})", rx.is_closed()); + stream_log!(debug, &step_id, "waiting for chunk via receiver"); // Check if the channel has been closed already if rx.is_closed() { @@ -1648,12 +1630,7 @@ async fn run_streaming_step_simple( match recv_result { Some(FlowResult::Streaming { stream_id, metadata, chunk, 
chunk_index, is_final }) => { - stream_log!(info, &step_id, "RECEIVED chunk #{} from receiver (chunk len: {})", chunk_index, chunk.len()); - stream_log!(info, &step_id, "processing chunk #{} (is_final={}) - VALIDATION: received chunk len={}", chunk_index, is_final, chunk.len()); - - if is_final { - stream_log!(warn, &step_id, "FINAL_CHUNK_TRACKING: Received final chunk #{} - will forward to downstream", chunk_index); - } + stream_log!(info, &step_id, "processing chunk #{} (is_final={})", chunk_index, is_final); // Store the streaming metadata for potential use in non-streaming case last_stream_id = stream_id.clone(); @@ -1666,8 +1643,6 @@ async fn run_streaming_step_simple( let (final_stream_id, final_metadata, final_chunk, final_chunk_index, final_is_final) = if !is_source { // For non-source steps, process the chunk with the component - stream_log!(info, &step_id, "calling component with chunk #{} (input chunk len: {})", chunk_index, chunk.len()); - // Create input for the component from the chunk let chunk_input_data = serde_json::json!({ "stream_id": stream_id, @@ -1679,7 +1654,6 @@ async fn run_streaming_step_simple( // Call the component with the chunk let chunk_input = stepflow_core::workflow::ValueRef::new(chunk_input_data); - stream_log!(info, &step_id, "sending input to component: chunk_len={}, stream_id={}", chunk.len(), stream_id); let component_result = execute_step_async( plugin.clone(), @@ -1690,13 +1664,10 @@ async fn run_streaming_step_simple( match component_result { Ok(FlowResult::Success { result }) => { - stream_log!(info, &step_id, "component returned success for chunk #{}", chunk_index); // For success results, forward the original chunk (stream_id, metadata, chunk, chunk_index, is_final) } Ok(FlowResult::Streaming { stream_id: new_stream_id, metadata: new_metadata, chunk: new_chunk, chunk_index: new_chunk_index, is_final: new_is_final }) => { - stream_log!(info, &step_id, "component returned streaming result for chunk #{} - OUTPUT chunk len: {}", chunk_index, new_chunk.len()); - stream_log!(warn, &step_id, "VALIDATION: input_chunk_len={}, output_chunk_len={}, input_stream_id={}, output_stream_id={}", chunk.len(), new_chunk.len(), stream_id, new_stream_id); // Component returned a streaming result, use it (new_stream_id, new_metadata, new_chunk, new_chunk_index, new_is_final) } @@ -1716,11 +1687,6 @@ async fn run_streaming_step_simple( }; // Forward to downstream steps - stream_log!(info, &step_id, "forwarding chunk #{} to {} downstream steps (final_chunk len: {}) is_final={}", final_chunk_index, downstream.len(), final_chunk.len(), final_is_final); - - if final_is_final { - stream_log!(warn, &step_id, "FINAL_CHUNK_TRACKING: Forwarding final chunk #{} to {} downstream steps", final_chunk_index, downstream.len()); - } if downstream.is_empty() { stream_log!(warn, &step_id, "no downstream channels to forward to!"); @@ -1755,18 +1721,11 @@ async fn run_streaming_step_simple( match tx.send(fr).await { Ok(_) => { - stream_log!(info, &step_id, "forwarded chunk #{} to downstream[{}] (step {}) is_final={}", - final_chunk_index, i, downstream_id, final_is_final); - if final_is_final { - stream_log!(warn, &step_id, "FINAL_CHUNK_TRACKING: Successfully forwarded final chunk to step {}", downstream_id); - } + stream_log!(debug, &step_id, "forwarded chunk #{} to step {}", final_chunk_index, downstream_id); } Err(e) => { - stream_log!(error, &step_id, "failed to forward chunk #{} to downstream[{}] (step {}): {:?}", - final_chunk_index, i, downstream_id, e); - if final_is_final { - 
stream_log!(error, &step_id, "FINAL_CHUNK_TRACKING: FAILED to forward final chunk to step {}: {:?}", downstream_id, e); - } + stream_log!(error, &step_id, "failed to forward chunk #{} to step {}: {:?}", + final_chunk_index, downstream_id, e); } } } diff --git a/sdks/python/src/stepflow_sdk/audio_components.py b/sdks/python/src/stepflow_sdk/audio_components.py index 2af62c6d..5f7bd9a2 100644 --- a/sdks/python/src/stepflow_sdk/audio_components.py +++ b/sdks/python/src/stepflow_sdk/audio_components.py @@ -18,9 +18,6 @@ import numpy as np import datetime -# GUARANTEED DEBUG OUTPUT - This should appear every time the module is loaded -sys.stderr.write("=== AUDIO_COMPONENTS.PY MODULE LOADED ===\n") -sys.stderr.flush() try: import sounddevice as sd @@ -115,7 +112,6 @@ def start_system_audio_stream(self): if not self.device_info: raise RuntimeError("No suitable system audio device found") - log_debug(f"Using system audio device: {self.device_info['name']}", "audio_stream_source") def _find_system_audio_device(self): """Find a suitable system audio device.""" @@ -182,10 +178,6 @@ def audio_stream_source(data: Dict[str, Any], context=None): Output: Streaming audio chunks with metadata """ - # Test stderr output - log_debug("TEST: audio_stream_source function called", "audio_stream_source") - - log_debug(f"audio_stream_source received input data: {data}", "audio_stream_source") # Extract parameters from input data source_type = data.get('source', 'sine_wave') @@ -197,16 +189,12 @@ def audio_stream_source(data: Dict[str, Any], context=None): frequency = data.get('frequency', 440.0) output_file = data.get('output_file', 'output_audio.wav') - log_debug(f"Extracted parameters - source_type: {source_type}, requested_sample_rate: {requested_sample_rate}, device_name: {device_name}", "audio_stream_source") start_time = time.time() - # Debug: Print the actual input data - log_debug(f"DEBUG: audio_stream_source received input data: {data}", "audio_stream_source") stream_id = str(uuid.uuid4()) - log_debug(f"TIMING: Starting audio_stream_source at {start_time}", "audio_stream_source") # Initialize PyAudio audio = pyaudio.PyAudio() @@ -218,7 +206,6 @@ def audio_stream_source(data: Dict[str, Any], context=None): info = audio.get_device_info_by_index(i) if device_name.lower() in info['name'].lower(): device_index = i - log_debug(f"Found device: {info['name']} (index {i})", "audio_stream_source") break # Auto-detect sample rate if device is specified and requested rate fails @@ -234,9 +221,7 @@ def audio_stream_source(data: Dict[str, Any], context=None): frames_per_buffer=chunk_size) test_stream.close() sample_rate = requested_sample_rate - log_debug(f"Using requested sample rate: {sample_rate} Hz for device", "audio_stream_source") except OSError: - log_debug(f"Requested sample rate {requested_sample_rate} Hz not supported, trying alternatives...", "audio_stream_source") # Try alternative sample rates if requested rate fails sample_rates = [16000, 22050, 44100, 48000] for rate in sample_rates: @@ -251,7 +236,6 @@ def audio_stream_source(data: Dict[str, Any], context=None): frames_per_buffer=chunk_size) test_stream.close() sample_rate = rate - log_debug(f"Using alternative sample rate: {sample_rate} Hz for device", "audio_stream_source") break except OSError: continue @@ -260,10 +244,6 @@ def audio_stream_source(data: Dict[str, Any], context=None): chunk_duration = chunk_size / sample_rate # seconds per chunk total_chunks = int(duration / chunk_duration) - log_debug(f"DEBUG: Generating {total_chunks} chunks for 
{duration}s audio at {sample_rate}Hz", "audio_stream_source") - log_debug(f"DEBUG: chunk_duration={chunk_duration}s, chunk_size={chunk_size} samples", "audio_stream_source") - log_debug(f"DEBUG: duration={duration}s, sample_rate={sample_rate}Hz", "audio_stream_source") - log_debug(f"DEBUG: total_chunks calculation: {duration} / {chunk_duration} = {total_chunks}", "audio_stream_source") # Collect all chunks for direct WAV file writing all_chunks = [] @@ -296,7 +276,6 @@ def record_audio_continuously(): frames_per_buffer=chunk_size ) - log_debug(f"Started continuous recording from device {device_index}", "audio_stream_source") chunk_index = 0 while not recording_stop.is_set() and chunk_index < total_chunks: @@ -304,27 +283,20 @@ def record_audio_continuously(): data = stream.read(chunk_size, exception_on_overflow=False) audio_queue.put((chunk_index, data)) chunk_index += 1 - log_debug(f"DEBUG: Recording thread put chunk {chunk_index}/{total_chunks} in queue", "audio_stream_source") - if chunk_index % 10 == 0: # Log every 10th chunk - log_debug(f"DEBUG: Recording thread recorded chunk {chunk_index}/{total_chunks}", "audio_stream_source") except Exception as e: - log_debug(f"Recording error: {e}", "audio_stream_source") recording_error = e break stream.stop_stream() stream.close() - log_debug(f"Recording thread completed after {chunk_index} chunks", "audio_stream_source") except Exception as e: - log_debug(f"Failed to start recording: {e}", "audio_stream_source") recording_error = e # Start recording thread recording_thread = threading.Thread(target=record_audio_continuously, daemon=True) recording_thread.start() - log_debug(f"DEBUG: Started continuous recording thread", "audio_stream_source") # Process chunks from the recording thread processed_chunks = 0 @@ -338,10 +310,6 @@ def record_audio_continuously(): # Determine if this is the final chunk is_final = chunk_index >= total_chunks - 1 - log_debug(f"DEBUG: Processing chunk {chunk_index}/{total_chunks}, processed={processed_chunks}, is_final={is_final}", "audio_stream_source") - - if is_final: - log_debug(f"FINAL_CHUNK: Sending final chunk {chunk_index} with is_final=True", "audio_stream_source") # Yield the chunk yield { @@ -360,16 +328,13 @@ def record_audio_continuously(): processed_chunks += 1 except Exception as e: - log_debug(f"DEBUG: Error processing chunk {processed_chunks}: {e}", "audio_stream_source") break - log_debug(f"DEBUG: Main loop completed after processing {processed_chunks} chunks", "audio_stream_source") # Stop recording recording_stop.set() recording_thread.join(timeout=2.0) - log_debug(f"DEBUG: Microphone recording loop completed. Processed {len(all_chunks)} chunks out of {total_chunks} expected.", "audio_stream_source") # Check for any recording errors after completion if recording_error: @@ -386,7 +351,6 @@ def record_audio_continuously(): chunk = source.get_system_audio_chunk() audio_capture_time = time.time() - log_debug(f"TIMING: System audio capture took {audio_capture_time - chunk_start_time:.4f}s", "audio_stream_source") all_chunks.append(chunk.data) chunk_b64 = base64.b64encode(chunk.data).decode('utf-8') @@ -405,7 +369,6 @@ def record_audio_continuously(): "output_file": output_file } except Exception as e: - log_debug(f"System audio capture failed: {e}. 
Raising error instead of falling back.", "audio_stream_source") raise RuntimeError(f"System audio capture failed: {e}") elif source_type == 'sine_wave': @@ -417,7 +380,6 @@ def record_audio_continuously(): chunk = source.generate_sine_wave_chunk(frequency, chunk_duration) audio_capture_time = time.time() - log_debug(f"TIMING: Sine wave generation took {audio_capture_time - chunk_start_time:.4f}s", "audio_stream_source") all_chunks.append(chunk.data) chunk_b64 = base64.b64encode(chunk.data).decode('utf-8') @@ -438,13 +400,10 @@ def record_audio_continuously(): else: raise ValueError(f"Unsupported audio source type: {source_type}. Supported types: microphone, system_audio, sine_wave") - log_debug(f"DEBUG: Generator loop completed. Processed {len(all_chunks)} chunks.", "audio_stream_source") # Note: WAV file writing is now handled by the audio_sink component # to ensure we write the processed audio, not just the source audio - total_time = time.time() - start_time - log_debug(f"TIMING: Total audio_stream_source execution took {total_time:.4f}s", "audio_stream_source") def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: @@ -487,15 +446,8 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: operation = data.get('operation', 'passthrough') output_file = data.get('output_file', 'output_audio.wav') - log_debug(f"TIMING: audio_chunk_processor starting chunk {chunk_index} at {start_time}", "audio_chunk_processor") - log_debug(f"VALIDATION: audio_chunk_processor received chunk_b64 length: {len(chunk_b64)}", "audio_chunk_processor") - log_debug(f"VALIDATION: audio_chunk_processor operation: {operation}", "audio_chunk_processor") - # Decode base64 chunk chunk_data = base64.b64decode(chunk_b64) - decode_time = time.time() - log_debug(f"TIMING: Base64 decode took {decode_time - start_time:.4f}s", "audio_chunk_processor") - log_debug(f"VALIDATION: decoded chunk_data length: {len(chunk_data)} bytes", "audio_chunk_processor") # Convert bytes to samples samples = [] @@ -503,8 +455,6 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: sample = int.from_bytes(chunk_data[i:i+2], 'little', signed=True) samples.append(sample) - convert_time = time.time() - log_debug(f"TIMING: Sample conversion took {convert_time - decode_time:.4f}s", "audio_chunk_processor") if operation == "amplify": # Amplify the audio (multiply by gain factor) @@ -515,8 +465,6 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: amplified_data = b''.join(sample.to_bytes(2, 'little', signed=True) for sample in amplified_samples) amplified_b64 = base64.b64encode(amplified_data).decode('utf-8') - process_time = time.time() - log_debug(f"TIMING: Amplification processing took {process_time - convert_time:.4f}s", "audio_chunk_processor") result = { "outcome": "streaming", @@ -540,8 +488,6 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: else: max_amplitude = avg_amplitude = rms = 0 - process_time = time.time() - log_debug(f"TIMING: Analysis processing took {process_time - convert_time:.4f}s", "audio_chunk_processor") result = { "outcome": "success", @@ -571,8 +517,6 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: "output_file": output_file } - total_time = time.time() - start_time - log_debug(f"TIMING: audio_chunk_processor total time for chunk {chunk_index}: {total_time:.4f}s", "audio_chunk_processor") return result @@ -621,17 +565,10 @@ def audio_sink(data: 
Dict[str, Any], context=None) -> Dict[str, Any]: output_file = data.get('output_file', 'output_audio.wav') play_audio = data.get('play_audio', False) - log_debug(f"TIMING: audio_sink starting chunk {chunk_index} at {start_time}", "audio_sink") - log_debug(f"DEBUG: audio_sink output_file: {output_file}", "audio_sink") - log_debug(f"DEBUG: audio_sink is_final: {is_final}", "audio_sink") - log_debug(f"DEBUG: audio_sink stream_id: {stream_id}", "audio_sink") - log_debug(f"VALIDATION: audio_sink received chunk_b64 length: {len(chunk_b64)}", "audio_sink") # Decode the chunk if chunk_b64: chunk_data = base64.b64decode(chunk_b64) - decode_time = time.time() - log_debug(f"TIMING: Base64 decode took {decode_time - start_time:.4f}s", "audio_sink") # Store the chunk for later writing if stream_id not in audio_sink._chunk_storage: @@ -644,7 +581,6 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: audio_sink._chunk_storage[stream_id]['chunks'].append(chunk_data) - log_debug(f"DEBUG: Stored chunk {chunk_index} for stream {stream_id}, total chunks: {len(audio_sink._chunk_storage[stream_id]['chunks'])}", "audio_sink") # Convert to samples for analysis samples = [] @@ -660,8 +596,6 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: else: max_amplitude = avg_amplitude = rms = 0 - analysis_time = time.time() - log_debug(f"TIMING: Audio analysis took {analysis_time - decode_time:.4f}s", "audio_sink") # Play audio if requested if play_audio: @@ -676,59 +610,42 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: sd.play(audio_array, samplerate=sample_rate) sd.wait() - play_time = time.time() - log_debug(f"TIMING: Audio playback took {play_time - analysis_time:.4f}s", "audio_sink") except ImportError: - log_debug("WARNING: sounddevice not available, skipping audio playback", "audio_sink") except Exception as e: - log_debug(f"ERROR: Audio playback failed: {e}", "audio_sink") # Write WAV file if this is the final chunk if is_final: - log_debug(f"DEBUG: Final chunk received - checking storage for stream {stream_id}", "audio_sink") - log_debug(f"DEBUG: Available streams in storage: {list(audio_sink._chunk_storage.keys())}", "audio_sink") if stream_id in audio_sink._chunk_storage: try: - log_debug(f"DEBUG: Writing final WAV file: {output_file}", "audio_sink") storage = audio_sink._chunk_storage[stream_id] all_audio_data = b''.join(storage['chunks']) - log_debug(f"DEBUG: Total chunks collected: {len(storage['chunks'])}", "audio_sink") - log_debug(f"DEBUG: Total audio data size: {len(all_audio_data)} bytes", "audio_sink") # Ensure the output directory exists output_dir = os.path.dirname(output_file) if output_dir and not os.path.exists(output_dir): - log_debug(f"DEBUG: Creating output directory: {output_dir}", "audio_sink") os.makedirs(output_dir, exist_ok=True) - log_debug(f"DEBUG: Writing {len(all_audio_data)} bytes to {output_file}", "audio_sink") with wave.open(output_file, 'wb') as wav_file: wav_file.setnchannels(storage['channels']) wav_file.setsampwidth(2) # 16-bit wav_file.setframerate(storage['sample_rate']) wav_file.writeframes(all_audio_data) - log_debug(f"SUCCESS: WAV file written successfully: {output_file} ({len(all_audio_data)} bytes)", "audio_sink") # Verify file was created if os.path.exists(output_file): file_size = os.path.getsize(output_file) - log_debug(f"SUCCESS: WAV file exists on disk: {output_file} ({file_size} bytes)", "audio_sink") - else: - log_debug(f"ERROR: WAV file not found on disk after writing: {output_file}", 
"audio_sink") # Clean up storage for this stream del audio_sink._chunk_storage[stream_id] except Exception as e: - log_debug(f"ERROR: Failed to write WAV file {output_file}: {e}", "audio_sink") import traceback traceback.print_exc(file=sys.stderr) else: - log_debug(f"ERROR: Stream {stream_id} not found in storage when final chunk received", "audio_sink") result = { "outcome": "success", @@ -755,7 +672,5 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: } } - total_time = time.time() - start_time - log_debug(f"TIMING: audio_sink total time for chunk {chunk_index}: {total_time:.4f}s", "audio_sink") return result \ No newline at end of file From c1896202172a808a0759b5ef4608fb00affe57fd Mon Sep 17 00:00:00 2001 From: phact Date: Thu, 26 Jun 2025 16:22:59 -0400 Subject: [PATCH 14/14] some cleanup --- .../src/workflow_executor.rs | 99 ++++--------------- .../src/stepflow_sdk/audio_components.py | 21 ++-- 2 files changed, 26 insertions(+), 94 deletions(-) diff --git a/crates/stepflow-execution/src/workflow_executor.rs b/crates/stepflow-execution/src/workflow_executor.rs index f843a4de..6c6c58cc 100644 --- a/crates/stepflow-execution/src/workflow_executor.rs +++ b/crates/stepflow-execution/src/workflow_executor.rs @@ -174,7 +174,7 @@ impl WorkflowExecutor { /// Check if the streaming pipeline is still active (has active receivers) pub fn is_streaming_pipeline_active(&self) -> bool { - if let Some(coord_arc) = &self.streaming_coordinator { + if let Some(_coord_arc) = &self.streaming_coordinator { // For now, just check if coordinator exists - we can't easily check receivers without async true } else { @@ -584,7 +584,7 @@ impl WorkflowExecutor { // Resolve step inputs let step_input = match self.resolver.resolve(&step.input).await? { FlowResult::Success { result } => result, - FlowResult::Streaming { stream_id, metadata, chunk, chunk_index, is_final } => { + FlowResult::Streaming { stream_id: _, metadata, chunk: _, chunk_index: _, is_final: _ } => { // For streaming steps, we can handle streaming inputs // For now, just return the metadata as the input metadata @@ -595,7 +595,7 @@ impl WorkflowExecutor { } .into()); } - FlowResult::Failed { error } => { + FlowResult::Failed { error: _ } => { return Err(ExecutionError::StepFailed { step: step_id }.into()); } }; @@ -976,67 +976,6 @@ impl WorkflowExecutor { Ok(()) } - /// Find all steps that are part of the same streaming pipeline - fn find_streaming_pipeline_steps(&self, start_step_index: usize) -> Vec { - let mut pipeline_steps = vec![start_step_index]; - let mut to_check = vec![start_step_index]; - let mut checked = std::collections::HashSet::new(); - - while let Some(step_index) = to_check.pop() { - if checked.contains(&step_index) { - continue; - } - checked.insert(step_index); - - let step = &self.flow.steps[step_index]; - - // Find steps that this step depends on (streaming inputs) - for (other_index, other_step) in self.flow.steps.iter().enumerate() { - if other_step.streaming && self.step_references_other_step(step, other_step) { - if !pipeline_steps.contains(&other_index) { - pipeline_steps.push(other_index); - to_check.push(other_index); - } - } - } - - // Find steps that depend on this step (streaming outputs) - for (other_index, other_step) in self.flow.steps.iter().enumerate() { - if other_step.streaming && self.step_references_other_step(other_step, step) { - if !pipeline_steps.contains(&other_index) { - pipeline_steps.push(other_index); - to_check.push(other_index); - } - } - } - } - - pipeline_steps.sort(); - 
pipeline_steps - } - - - /// Find currently active streaming steps using in-memory workflow information - /// This avoids depending on state store data that might be cleaned up - fn find_active_streaming_steps_in_memory(&self) -> Vec { - let mut active_steps = Vec::new(); - - for (step_index, step) in self.flow.steps.iter().enumerate() { - if step.streaming { - // For streaming steps, assume they are active if they exist in the coordinator - if let Some(_coord_arc) = &self.streaming_coordinator { - // For now, just assume all streaming steps are active - // We can't easily check step_receivers without async - active_steps.push(step_index); - tracing::debug!("Found active streaming step {} in coordinator", step_index); - } - } - } - - tracing::debug!("Found {} active streaming steps: {:?}", active_steps.len(), active_steps); - active_steps - } - } impl Drop for WorkflowExecutor { @@ -1349,7 +1288,7 @@ impl StreamingPipelineCoordinator { let mut incoming_chunks_rx = { let mut guard = coord_arc.lock().await; // Move the receiver out of the coordinator for the main loop - let (dummy_tx, dummy_rx) = mpsc::channel::(1); + let (_dummy_tx, dummy_rx) = mpsc::channel::(1); std::mem::replace(&mut guard.incoming_chunks, dummy_rx) }; @@ -1375,7 +1314,7 @@ impl StreamingPipelineCoordinator { // Check if any handles are ready let mut i = 0; while i < remaining_handles.len() { - let (step_idx, handle) = &mut remaining_handles[i]; + let (_step_idx, handle) = &mut remaining_handles[i]; if handle.is_finished() { let (step_idx, handle) = remaining_handles.remove(i); let step_id = &flow.steps[step_idx].id; @@ -1557,7 +1496,7 @@ impl StreamingPipelineCoordinator { } .into()); } - FlowResult::Failed { error } => { + FlowResult::Failed { error: _ } => { return Err(ExecutionError::StepFailed { step: step.id.clone() }.into()); } }; @@ -1573,7 +1512,7 @@ impl StreamingPipelineCoordinator { async fn run_streaming_step_simple( plugin: Arc>, step: stepflow_core::workflow::Step, - input: stepflow_core::workflow::ValueRef, + _input: stepflow_core::workflow::ValueRef, context: ExecutionContext, mut rx: mpsc::Receiver, downstream: Vec<(String, mpsc::Sender)>, @@ -1597,11 +1536,11 @@ async fn run_streaming_step_simple( } // Now loop for all chunks coming through the coordinator's routing system - let mut last_stream_id = String::new(); - let mut last_metadata = stepflow_core::workflow::ValueRef::new(serde_json::Value::Null); - let mut last_chunk = String::new(); - let mut last_chunk_index = 0; - let mut last_is_final = false; + let mut _last_stream_id = String::new(); + let mut _last_metadata = stepflow_core::workflow::ValueRef::new(serde_json::Value::Null); + let mut _last_chunk = String::new(); + let mut _last_chunk_index = 0; + let mut _last_is_final = false; loop { stream_log!(debug, &step_id, "waiting for chunk via receiver"); @@ -1633,11 +1572,11 @@ async fn run_streaming_step_simple( stream_log!(info, &step_id, "processing chunk #{} (is_final={})", chunk_index, is_final); // Store the streaming metadata for potential use in non-streaming case - last_stream_id = stream_id.clone(); - last_metadata = metadata.clone(); - last_chunk = chunk.clone(); - last_chunk_index = chunk_index; - last_is_final = is_final; + _last_stream_id = stream_id.clone(); + _last_metadata = metadata.clone(); + _last_chunk = chunk.clone(); + _last_chunk_index = chunk_index; + _last_is_final = is_final; // Process the chunk with the component (for non-source steps) let (final_stream_id, final_metadata, final_chunk, final_chunk_index, 
final_is_final) = @@ -1663,7 +1602,7 @@ async fn run_streaming_step_simple( ).await; match component_result { - Ok(FlowResult::Success { result }) => { + Ok(FlowResult::Success { result: _ }) => { // For success results, forward the original chunk (stream_id, metadata, chunk, chunk_index, is_final) } @@ -1760,7 +1699,7 @@ fn sort_streaming_steps_by_dependencies( use std::collections::{HashMap, HashSet, VecDeque}; // Create a map of step ID to index for quick lookup - let step_id_to_index: HashMap = streaming_steps + let _step_id_to_index: HashMap = streaming_steps .iter() .map(|&idx| (flow.steps[idx].id.clone(), idx)) .collect(); diff --git a/sdks/python/src/stepflow_sdk/audio_components.py b/sdks/python/src/stepflow_sdk/audio_components.py index 5f7bd9a2..a712d793 100644 --- a/sdks/python/src/stepflow_sdk/audio_components.py +++ b/sdks/python/src/stepflow_sdk/audio_components.py @@ -16,7 +16,6 @@ import queue import sys import numpy as np -import datetime try: @@ -154,11 +153,6 @@ def get_system_audio_chunk(self): ) -def log_debug(message, component="unknown"): - """Write debug message to stderr so it shows up in StepFlow logs.""" - timestamp = datetime.datetime.now().strftime("%Y-%m-%d %H:%M:%S") - sys.stderr.write(f"[{timestamp}] [{component}] {message}\n") - sys.stderr.flush() # Ensure it is written immediately def audio_stream_source(data: Dict[str, Any], context=None): @@ -420,8 +414,6 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: Output: Processed chunk or analysis results """ - import time - start_time = time.time() # Handle streaming chunk format - extract the actual chunk data if 'outcome' in data and data['outcome'] == 'streaming': @@ -465,7 +457,6 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: amplified_data = b''.join(sample.to_bytes(2, 'little', signed=True) for sample in amplified_samples) amplified_b64 = base64.b64encode(amplified_data).decode('utf-8') - result = { "outcome": "streaming", "stream_id": stream_id, @@ -488,7 +479,6 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: else: max_amplitude = avg_amplitude = rms = 0 - result = { "outcome": "success", "result": { @@ -517,7 +507,6 @@ def audio_chunk_processor(data: Dict[str, Any], context=None) -> Dict[str, Any]: "output_file": output_file } - return result @@ -535,8 +524,6 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: Output: Confirmation of chunk received and file written """ - import time - start_time = time.time() # Global storage for accumulating chunks across function calls if not hasattr(audio_sink, '_chunk_storage'): @@ -612,7 +599,11 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: except ImportError: + # sounddevice not available, skip audio playback + pass except Exception as e: + # Audio playback failed + pass # Write WAV file if this is the final chunk if is_final: @@ -643,9 +634,12 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: del audio_sink._chunk_storage[stream_id] except Exception as e: + # Error writing WAV file import traceback traceback.print_exc(file=sys.stderr) else: + # Stream not found in storage when final chunk received + pass result = { "outcome": "success", @@ -672,5 +666,4 @@ def audio_sink(data: Dict[str, Any], context=None) -> Dict[str, Any]: } } - return result \ No newline at end of file
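
The cleanup above leaves the streaming chunk envelope itself unchanged: components still exchange dicts carrying stream_id, metadata, a base64-encoded chunk, chunk_index, and is_final, and audio_sink buffers decoded chunks per stream until the final one arrives. As a minimal standalone sketch of that accumulation step (not part of the patch): the helper name collect_stream_to_wav and the default sample_rate/channels values below are illustrative, while the field names mirror the envelopes produced by audio_stream_source and audio_chunk_processor in this series.

import base64
import wave

def collect_stream_to_wav(envelopes, output_file, sample_rate=16000, channels=1):
    """Buffer base64 chunk envelopes and write one 16-bit PCM WAV when the final chunk arrives."""
    buffered = []
    for envelope in envelopes:
        # Each envelope follows the dict shape used in this series:
        # {"stream_id": ..., "chunk": <base64>, "chunk_index": n, "is_final": bool, ...}
        buffered.append(base64.b64decode(envelope["chunk"]))
        if envelope.get("is_final"):
            with wave.open(output_file, "wb") as wav_file:
                wav_file.setnchannels(channels)
                wav_file.setsampwidth(2)  # 16-bit samples, matching audio_sink
                wav_file.setframerate(sample_rate)
                wav_file.writeframes(b"".join(buffered))
            return output_file
    return None

Unlike this single-stream sketch, the real audio_sink keys its buffer by stream_id (audio_sink._chunk_storage), so chunks from interleaved streams cannot collide before the final chunk triggers the WAV write.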