[CHORE] Swordfish specific test fixtures (#3164)
This PR sets up a few swordfish-related test fixtures, specifically:

- Parameterize `default_morsel_size = [1, None]` for dataframe tests
that do any repartitioning (e.g. `into_partitions`). This is to make
sure that operator parallelism is exercised.
- Set up iteration tests in `test_iter.py`.
- Make the ordering assertions stricter in some tests. E.g. some tests
do `assert df.sort(col) == expected`, but `df` has other columns that
may not be deterministically ordered, and sorting on a single column is
not enough when `morsel_size = 1`. This isn't a problem with swordfish
but with the test: the sort should actually involve more columns (see
the sketch below).
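
As an illustration of the stricter assertions (hypothetical column names, not code from this PR), breaking ties explicitly makes the expected ordering deterministic:

```python
import daft

# Hypothetical example: `group` alone does not uniquely order the rows,
# so rows with equal `group` values may come back in any order.
df = daft.from_pydict({"group": [1, 1, 2], "value": [3, 2, 1]})

# Fragile: ties on `group` leave the order of `value` unspecified.
# df.sort("group")

# Stricter: sort on enough columns to make the row order deterministic.
result = df.sort(["group", "value"]).to_pydict()
assert result == {"group": [1, 1, 2], "value": [2, 3, 1]}
```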

Big note: There was a problem with pivot not getting applied correctly.
A dataframe pivot operation consists of an aggregation plus the actual
pivoting, but pivot was previously implemented as an intermediate
operator, and the results of the aggregation were getting buffered and
fed to it in chunks. For the pivot to work, it has to receive all rows
with the same group_by keys together. This PR reimplements Pivot as a
BlockingSink, so all of that work happens in one place.
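
To see why chunked input breaks pivoting, here is a rough illustration in plain Python (hypothetical data, not Daft's API): a pivot that only sees part of a group's rows emits an incomplete wide row that is never repaired.

```python
from collections import defaultdict

# Hypothetical aggregated rows: (group_by key, pivot value, aggregated value).
agg_rows = [
    ("a", "x", 1),
    ("a", "y", 2),
    ("b", "x", 3),
]

def pivot(rows, names=("x", "y")):
    # Collect every pivot_value -> value pair per group_by key.
    wide = defaultdict(dict)
    for group, pivot_value, value in rows:
        wide[group][pivot_value] = value
    # One output row per group, with one column per pivot name.
    return {group: [cols.get(n) for n in names] for group, cols in wide.items()}

# Correct only when all rows for a group arrive together:
assert pivot(agg_rows) == {"a": [1, 2], "b": [3, None]}

# Fed a buffered chunk containing only the first row, group "a" comes out
# as [1, None] and the missing "y" column can never be filled in later.
assert pivot(agg_rows[:1]) == {"a": [1, None]}
```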

---------

Co-authored-by: Colin Ho <[email protected]>
colin-ho and Colin Ho authored Nov 5, 2024
1 parent 3cef614 commit 96c538b
Showing 31 changed files with 391 additions and 302 deletions.
1 change: 0 additions & 1 deletion src/daft-local-execution/src/intermediate_ops/mod.rs
@@ -5,7 +5,6 @@ pub mod explode;
pub mod filter;
pub mod inner_hash_join_probe;
pub mod intermediate_op;
pub mod pivot;
pub mod project;
pub mod sample;
pub mod unpivot;
57 changes: 0 additions & 57 deletions src/daft-local-execution/src/intermediate_ops/pivot.rs

This file was deleted.

13 changes: 8 additions & 5 deletions src/daft-local-execution/src/pipeline.rs
@@ -28,8 +28,8 @@ use crate::{
actor_pool_project::ActorPoolProjectOperator, aggregate::AggregateOperator,
anti_semi_hash_join_probe::AntiSemiProbeOperator, explode::ExplodeOperator,
filter::FilterOperator, inner_hash_join_probe::InnerHashJoinProbeOperator,
intermediate_op::IntermediateNode, pivot::PivotOperator, project::ProjectOperator,
sample::SampleOperator, unpivot::UnpivotOperator,
intermediate_op::IntermediateNode, project::ProjectOperator, sample::SampleOperator,
unpivot::UnpivotOperator,
},
sinks::{
aggregate::AggregateSink,
@@ -38,6 +38,7 @@ use crate::{
hash_join_build::HashJoinBuildSink,
limit::LimitSink,
outer_hash_join_probe::OuterHashJoinProbeSink,
pivot::PivotSink,
sort::SortSink,
streaming_sink::StreamingSinkNode,
write::{WriteFormat, WriteSink},
@@ -282,17 +283,19 @@ pub fn physical_plan_to_pipeline(
group_by,
pivot_column,
value_column,
aggregation,
names,
..
}) => {
let pivot_op = PivotOperator::new(
let child_node = physical_plan_to_pipeline(input, psets, cfg)?;
let pivot_sink = PivotSink::new(
group_by.clone(),
pivot_column.clone(),
value_column.clone(),
aggregation.clone(),
names.clone(),
);
let child_node = physical_plan_to_pipeline(input, psets, cfg)?;
IntermediateNode::new(Arc::new(pivot_op), vec![child_node]).boxed()
BlockingSinkNode::new(Arc::new(pivot_sink), child_node).boxed()
}
LocalPhysicalPlan::Sort(Sort {
input,
1 change: 1 addition & 0 deletions src/daft-local-execution/src/sinks/mod.rs
@@ -4,6 +4,7 @@ pub mod concat;
pub mod hash_join_build;
pub mod limit;
pub mod outer_hash_join_probe;
pub mod pivot;
pub mod sort;
pub mod streaming_sink;
pub mod write;
126 changes: 126 additions & 0 deletions src/daft-local-execution/src/sinks/pivot.rs
@@ -0,0 +1,126 @@
use std::sync::Arc;

use common_error::DaftResult;
use daft_dsl::{AggExpr, Expr, ExprRef};
use daft_micropartition::MicroPartition;
use tracing::instrument;

use super::blocking_sink::{BlockingSink, BlockingSinkState, BlockingSinkStatus};
use crate::{pipeline::PipelineResultType, NUM_CPUS};

enum PivotState {
Accumulating(Vec<Arc<MicroPartition>>),
Done,
}

impl PivotState {
fn push(&mut self, part: Arc<MicroPartition>) {
if let Self::Accumulating(ref mut parts) = self {
parts.push(part);
} else {
panic!("PivotSink should be in Accumulating state");
}
}

fn finalize(&mut self) -> Vec<Arc<MicroPartition>> {
let res = if let Self::Accumulating(ref mut parts) = self {
std::mem::take(parts)
} else {
panic!("PivotSink should be in Accumulating state");
};
*self = Self::Done;
res
}
}

impl BlockingSinkState for PivotState {
fn as_any_mut(&mut self) -> &mut dyn std::any::Any {
self
}
}

pub struct PivotSink {
pub group_by: Vec<ExprRef>,
pub pivot_column: ExprRef,
pub value_column: ExprRef,
pub aggregation: AggExpr,
pub names: Vec<String>,
}

impl PivotSink {
pub fn new(
group_by: Vec<ExprRef>,
pivot_column: ExprRef,
value_column: ExprRef,
aggregation: AggExpr,
names: Vec<String>,
) -> Self {
Self {
group_by,
pivot_column,
value_column,
aggregation,
names,
}
}
}

impl BlockingSink for PivotSink {
#[instrument(skip_all, name = "PivotSink::sink")]
fn sink(
&self,
input: &Arc<MicroPartition>,
mut state: Box<dyn BlockingSinkState>,
) -> DaftResult<BlockingSinkStatus> {
state
.as_any_mut()
.downcast_mut::<PivotState>()
.expect("PivotSink should have PivotState")
.push(input.clone());
Ok(BlockingSinkStatus::NeedMoreInput(state))
}

#[instrument(skip_all, name = "PivotSink::finalize")]
fn finalize(
&self,
states: Vec<Box<dyn BlockingSinkState>>,
) -> DaftResult<Option<PipelineResultType>> {
let all_parts = states.into_iter().flat_map(|mut state| {
state
.as_any_mut()
.downcast_mut::<PivotState>()
.expect("PivotSink should have PivotState")
.finalize()
});
let concated = MicroPartition::concat(all_parts)?;
let group_by_with_pivot = self
.group_by
.iter()
.chain(std::iter::once(&self.pivot_column))
.cloned()
.collect::<Vec<_>>();
let agged = concated.agg(
&[Expr::Agg(self.aggregation.clone()).into()],
&group_by_with_pivot,
)?;
let pivoted = Arc::new(agged.pivot(
&self.group_by,
self.pivot_column.clone(),
self.value_column.clone(),
self.names.clone(),
)?);
Ok(Some(pivoted.into()))
}

fn name(&self) -> &'static str {
"PivotSink"
}

fn max_concurrency(&self) -> usize {
*NUM_CPUS
}

fn make_state(&self) -> DaftResult<Box<dyn BlockingSinkState>> {
Ok(Box::new(PivotState::Accumulating(vec![])))
}
}
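
For readers who don't follow the Rust, the finalize step above is, conceptually, the following (plain Python sketch with hypothetical data and sum as the aggregation; not Daft's actual API):

```python
from collections import defaultdict

# Hypothetical micropartitions buffered by sink() across worker states,
# as (group_by key, pivot value, value) rows.
partitions = [
    [("a", "x", 1), ("a", "x", 2)],
    [("a", "y", 5), ("b", "x", 7)],
]

# 1. Concatenate everything that was buffered.
rows = [row for part in partitions for row in part]

# 2. Aggregate on group_by + pivot_column (here: sum of the value column).
agg = defaultdict(int)
for group, pivot_value, value in rows:
    agg[(group, pivot_value)] += value

# 3. Pivot: one row per group_by key, one column per pivot name.
names = ["x", "y"]
pivoted = {
    group: [agg.get((group, name)) for name in names]
    for group in {g for g, _ in agg}
}
assert pivoted == {"a": [3, 5], "b": [7, None]}
```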
3 changes: 3 additions & 0 deletions src/daft-physical-plan/src/local_plan.rs
@@ -205,6 +205,7 @@ impl LocalPhysicalPlan {
group_by: Vec<ExprRef>,
pivot_column: ExprRef,
value_column: ExprRef,
aggregation: AggExpr,
names: Vec<String>,
schema: SchemaRef,
) -> LocalPhysicalPlanRef {
@@ -213,6 +214,7 @@
group_by,
pivot_column,
value_column,
aggregation,
names,
schema,
plan_stats: PlanStats {},
@@ -438,6 +440,7 @@ pub struct Pivot {
pub group_by: Vec<ExprRef>,
pub pivot_column: ExprRef,
pub value_column: ExprRef,
pub aggregation: AggExpr,
pub names: Vec<String>,
pub schema: SchemaRef,
pub plan_stats: PlanStats,
23 changes: 3 additions & 20 deletions src/daft-physical-plan/src/translate.rs
@@ -1,5 +1,5 @@
use common_error::{DaftError, DaftResult};
use daft_core::{join::JoinStrategy, prelude::Schema};
use daft_core::join::JoinStrategy;
use daft_dsl::ExprRef;
use daft_plan::{JoinType, LogicalPlan, LogicalPlanRef, SourceInfo};

@@ -91,29 +91,12 @@ pub fn translate(plan: &LogicalPlanRef) -> DaftResult<LocalPhysicalPlanRef> {
}
LogicalPlan::Pivot(pivot) => {
let input = translate(&pivot.input)?;
let groupby_with_pivot = pivot
.group_by
.iter()
.chain(std::iter::once(&pivot.pivot_column))
.cloned()
.collect::<Vec<_>>();
let aggregate_fields = groupby_with_pivot
.iter()
.map(|expr| expr.to_field(input.schema()))
.chain(std::iter::once(pivot.aggregation.to_field(input.schema())))
.collect::<DaftResult<Vec<_>>>()?;
let aggregate_schema = Schema::new(aggregate_fields)?;
let aggregate = LocalPhysicalPlan::hash_aggregate(
input,
vec![pivot.aggregation.clone(); 1],
groupby_with_pivot,
aggregate_schema.into(),
);
Ok(LocalPhysicalPlan::pivot(
aggregate,
input,
pivot.group_by.clone(),
pivot.pivot_column.clone(),
pivot.value_column.clone(),
pivot.aggregation.clone(),
pivot.names.clone(),
pivot.output_schema.clone(),
))
11 changes: 11 additions & 0 deletions tests/conftest.py
@@ -7,6 +7,7 @@
import pytest

import daft
import daft.context
from daft.table import MicroPartition

# import all conftest
@@ -170,3 +171,13 @@ def assert_df_equals(
except AssertionError:
print(f"Failed assertion for col: {col}")
raise


@pytest.fixture(
scope="function",
params=[1, None] if daft.context.get_context().daft_execution_config.enable_native_executor else [None],
)
def with_morsel_size(request):
morsel_size = request.param
with daft.context.execution_config_ctx(default_morsel_size=morsel_size):
yield morsel_size
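
A test opts into the fixture simply by taking it as an argument; for example (hypothetical test, not part of this PR):

```python
import daft

def test_repartition_preserves_rows(with_morsel_size):
    # Runs once with default_morsel_size=1 and once with the default (None)
    # when the native executor is enabled; otherwise only with the default.
    df = daft.from_pydict({"a": list(range(100))})
    result = df.repartition(4).sort("a").to_pydict()
    assert result == {"a": list(range(100))}
```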
5 changes: 4 additions & 1 deletion tests/cookbook/conftest.py
@@ -42,7 +42,10 @@ def service_requests_csv_pd_df():
return pd.read_csv(COOKBOOK_DATA_CSV, keep_default_na=False)[COLUMNS]


@pytest.fixture(scope="module", params=[1, 2])
@pytest.fixture(
scope="module",
params=[1, 2] if daft.context.get_context().daft_execution_config.enable_native_executor is False else [1],
)
def repartition_nparts(request):
"""Adds a `n_repartitions` parameter to test cases which provides the number of
partitions that the test case should repartition its dataset into for testing