From d27f7b234e0f5898853689e53c9d8c315ecbf116 Mon Sep 17 00:00:00 2001 From: Orson Peters Date: Tue, 24 Dec 2024 16:13:08 +0100 Subject: [PATCH] perf: Don't collect all LHS arrays in gather (#20441) --- .../src/chunked_array/gather/chunked.rs | 25 ++++++++----------- 1 file changed, 11 insertions(+), 14 deletions(-) diff --git a/crates/polars-ops/src/chunked_array/gather/chunked.rs b/crates/polars-ops/src/chunked_array/gather/chunked.rs index 44c03f09d2c3..58ceafea92c9 100644 --- a/crates/polars-ops/src/chunked_array/gather/chunked.rs +++ b/crates/polars-ops/src/chunked_array/gather/chunked.rs @@ -321,31 +321,30 @@ where ) -> Self { let arrow_dtype = self.dtype().to_arrow(CompatLevel::newest()); - let mut out = if let Some(iter) = self.downcast_slices() { - let targets = iter.collect::>(); + let mut out = if !self.has_nulls() { let iter = by.iter().map(|chunk_id| { debug_assert!( !chunk_id.is_null(), "null chunks should not hit this branch" ); let (chunk_idx, array_idx) = chunk_id.extract(); - let vals = targets.get_unchecked(chunk_idx as usize); - vals.get_unchecked(array_idx as usize).clone() + let arr = self.downcast_get_unchecked(chunk_idx as usize); + arr.value_unchecked(array_idx as usize).clone() }); let arr = iter.collect_arr_trusted_with_dtype(arrow_dtype); ChunkedArray::with_chunk(self.name().clone(), arr) } else { - let targets = self.downcast_iter().collect::>(); let iter = by.iter().map(|chunk_id| { debug_assert!( !chunk_id.is_null(), "null chunks should not hit this branch" ); let (chunk_idx, array_idx) = chunk_id.extract(); - let vals = targets.get_unchecked(chunk_idx as usize); - vals.get_unchecked(array_idx as usize) + let arr = self.downcast_get_unchecked(chunk_idx as usize); + arr.get_unchecked(array_idx as usize) }); + let arr = iter.collect_arr_trusted_with_dtype(arrow_dtype); ChunkedArray::with_chunk(self.name().clone(), arr) }; @@ -358,8 +357,7 @@ where unsafe fn take_opt_chunked_unchecked(&self, by: &[ChunkId]) -> Self { let arrow_dtype = self.dtype().to_arrow(CompatLevel::newest()); - if let Some(iter) = self.downcast_slices() { - let targets = iter.collect::>(); + if !self.has_nulls() { let arr = by .iter() .map(|chunk_id| { @@ -367,15 +365,14 @@ where None } else { let (chunk_idx, array_idx) = chunk_id.extract(); - let vals = *targets.get_unchecked(chunk_idx as usize); - Some(vals.get_unchecked(array_idx as usize).clone()) + let arr = self.downcast_get_unchecked(chunk_idx as usize); + Some(arr.value_unchecked(array_idx as usize).clone()) } }) .collect_arr_trusted_with_dtype(arrow_dtype); ChunkedArray::with_chunk(self.name().clone(), arr) } else { - let targets = self.downcast_iter().collect::>(); let arr = by .iter() .map(|chunk_id| { @@ -383,8 +380,8 @@ where None } else { let (chunk_idx, array_idx) = chunk_id.extract(); - let vals = *targets.get_unchecked(chunk_idx as usize); - vals.get_unchecked(array_idx as usize) + let arr = self.downcast_get_unchecked(chunk_idx as usize); + arr.get_unchecked(array_idx as usize) } }) .collect_arr_trusted_with_dtype(arrow_dtype);