datafusion_physical_plan::windows::bounded_window_agg_exec

Struct LinearSearch

pub struct LinearSearch {
    input_buffer_hashes: VecDeque<u64>,
    random_state: RandomState,
    ordered_partition_by_indices: Vec<usize>,
    row_map_batch: HashTable<(u64, usize)>,
    row_map_out: HashTable<(u64, usize, usize)>,
    input_schema: SchemaRef,
}

Expand description

This object encapsulates the state of a simple linear-scan algorithm for computing partitions.

Fields§

§input_buffer_hashes: VecDeque<u64>

Keeps the hashes of the input buffer, calculated from the PARTITION BY columns. Its length is equal to the length of input_buffer.

§random_state: RandomState

Used during hash value calculation.

§ordered_partition_by_indices: Vec<usize>

Input ordering and partition by key ordering need not be the same, so this vector stores the mapping between them. For instance, if the input is ordered by a, b and the window expression contains a PARTITION BY b, a clause, this attribute stores [1, 0].

§row_map_batch: HashTable<(u64, usize)>

We use this [HashTable] to calculate the unique partitions for each new RecordBatch. The first entry in the tuple is the hash value; the second entry is the unique ID of the partition (IDs increment from 0 to n).

§row_map_out: HashTable<(u64, usize, usize)>

We use this [HashTable] to calculate the output columns that we can produce at each cycle. The first entry in the tuple is the hash value; the second entry is the unique ID of the partition (IDs increment from 0 to n). The third entry stores how many new outputs have been calculated for the corresponding partition.

§input_schema: SchemaRef

Struct LinearSearch Copy item path

Fields§

Implementations§

impl LinearSearch

fn new( ordered_partition_by_indices: Vec<usize>, input_schema: SchemaRef, ) -> Self

fn get_per_partition_indices( &mut self, columns: &[ArrayRef], batch: &RecordBatch, ) -> Result<Vec<(PartitionKey, Vec<u32>)>>

fn calc_partition_output_indices( &mut self, input_buffer: &RecordBatch, window_agg_states: &[PartitionWindowAggStates], window_expr: &[Arc<dyn WindowExpr>], ) -> Result<Vec<(PartitionKey, Vec<u32>)>>

Trait Implementations§

impl PartitionSearcher for LinearSearch

fn calculate_out_columns( &mut self, input_buffer: &RecordBatch, window_agg_states: &[PartitionWindowAggStates], partition_buffers: &mut PartitionBatches, window_expr: &[Arc<dyn WindowExpr>], ) -> Result<Option<Vec<ArrayRef>>>

fn evaluate_partition_batches( &mut self, record_batch: &RecordBatch, window_expr: &[Arc<dyn WindowExpr>], ) -> Result<Vec<(PartitionKey, RecordBatch)>>

fn prune(&mut self, n_out: usize)

fn mark_partition_end(&self, partition_buffers: &mut PartitionBatches)

fn is_mode_linear(&self) -> bool

fn input_schema(&self) -> &SchemaRef

fn update_partition_batch( &mut self, input_buffer: &mut RecordBatch, record_batch: RecordBatch, window_expr: &[Arc<dyn WindowExpr>], partition_buffers: &mut PartitionBatches, ) -> Result<()>

Auto Trait Implementations§

impl Freeze for LinearSearch

impl RefUnwindSafe for LinearSearch

impl Send for LinearSearch

impl Sync for LinearSearch

impl Unpin for LinearSearch

impl UnwindSafe for LinearSearch

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> PolicyExt for T where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P> where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P> where T: Policy<B, E>, P: Policy<B, E>,

impl<T> Same for T

type Output = T

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

impl<T> Allocation for T where T: RefUnwindSafe + Send + Sync,

impl<T> ErasedDestructor for T where T: 'static,

Struct LinearSearch

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> PolicyExt for T
where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

impl<T> Allocation for T
where T: RefUnwindSafe + Send + Sync,

impl<T> ErasedDestructor for T
where T: 'static,