From ffc55386f3ad49749894f9c09c61c7cf9dcd6da9 Mon Sep 17 00:00:00 2001 From: Orson Peters Date: Wed, 25 Dec 2024 08:01:15 +0100 Subject: [PATCH] perf: Re-enable common subplan elim for new-streaming engine (#20443) --- crates/polars-lazy/src/frame/mod.rs | 4 ---- .../src/physical_plan/lower_ir.rs | 19 ++++++++++++++++++- crates/polars-stream/src/physical_plan/mod.rs | 2 ++ .../tests/unit/lazyframe/test_lazyframe.py | 1 + 4 files changed, 21 insertions(+), 5 deletions(-) diff --git a/crates/polars-lazy/src/frame/mod.rs b/crates/polars-lazy/src/frame/mod.rs index 535a557b0c02..ab1f1bc1835c 100644 --- a/crates/polars-lazy/src/frame/mod.rs +++ b/crates/polars-lazy/src/frame/mod.rs @@ -619,10 +619,6 @@ impl LazyFrame { // The new streaming engine can't deal with the way the common // subexpression elimination adds length-incorrect with_columns. opt_state &= !OptFlags::COMM_SUBEXPR_ELIM; - - // The new streaming engine can't yet deal with the cache nodes - // introduced by common subplan elimination. - opt_state &= !OptFlags::COMM_SUBPLAN_ELIM; } let lp_top = optimize( diff --git a/crates/polars-stream/src/physical_plan/lower_ir.rs b/crates/polars-stream/src/physical_plan/lower_ir.rs index bad63a0e767b..05cdd8864b80 100644 --- a/crates/polars-stream/src/physical_plan/lower_ir.rs +++ b/crates/polars-stream/src/physical_plan/lower_ir.rs @@ -86,6 +86,7 @@ pub fn lower_ir( phys_sm: &mut SlotMap, schema_cache: &mut PlHashMap>, expr_cache: &mut ExprCache, + cache_nodes: &mut PlHashMap, ) -> PolarsResult { // Helper macro to simplify recursive calls. macro_rules! lower_ir { @@ -97,6 +98,7 @@ pub fn lower_ir( phys_sm, schema_cache, expr_cache, + cache_nodes, ) }; } @@ -431,7 +433,22 @@ pub fn lower_ir( #[cfg(feature = "python")] IR::PythonScan { .. } => todo!(), - IR::Cache { .. } => todo!(), + + IR::Cache { + input, + id, + cache_hits: _, + } => { + let id = *id; + if let Some(cached) = cache_nodes.get(&id) { + return Ok(*cached); + } + + let phys_input = lower_ir!(*input)?; + cache_nodes.insert(id, phys_input); + return Ok(phys_input); + }, + IR::GroupBy { input, keys, diff --git a/crates/polars-stream/src/physical_plan/mod.rs b/crates/polars-stream/src/physical_plan/mod.rs index c5f679c7fe56..217131b18b03 100644 --- a/crates/polars-stream/src/physical_plan/mod.rs +++ b/crates/polars-stream/src/physical_plan/mod.rs @@ -253,6 +253,7 @@ pub fn build_physical_plan( ) -> PolarsResult { let mut schema_cache = PlHashMap::with_capacity(ir_arena.len()); let mut expr_cache = ExprCache::with_capacity(expr_arena.len()); + let mut cache_nodes = PlHashMap::new(); let phys_root = lower_ir::lower_ir( root, ir_arena, @@ -260,6 +261,7 @@ pub fn build_physical_plan( phys_sm, &mut schema_cache, &mut expr_cache, + &mut cache_nodes, )?; let mut referenced = SecondaryMap::with_capacity(phys_sm.capacity()); insert_multiplexers(phys_root, phys_sm, &mut referenced); diff --git a/py-polars/tests/unit/lazyframe/test_lazyframe.py b/py-polars/tests/unit/lazyframe/test_lazyframe.py index 4aafc9d523ee..5ef0b65deba8 100644 --- a/py-polars/tests/unit/lazyframe/test_lazyframe.py +++ b/py-polars/tests/unit/lazyframe/test_lazyframe.py @@ -1124,6 +1124,7 @@ def test_lazy_cache_same_key() -> None: assert_frame_equal(result, expected) +@pytest.mark.may_fail_auto_streaming def test_lazy_cache_hit(monkeypatch: Any, capfd: Any) -> None: monkeypatch.setenv("POLARS_VERBOSE", "1")