Struct mz_persist_client::iter::Consolidator

source ·

pub(crate) struct Consolidator<T, D, Sort: RowSort<T, D> = CodecSort<T, D>> {
    context: String,
    shard_id: ShardId,
    sort: Sort,
    blob: Arc<dyn Blob>,
    metrics: Arc<Metrics>,
    shard_metrics: Arc<ShardMetrics>,
    read_metrics: Arc<ReadMetrics>,
    runs: Vec<VecDeque<(ConsolidationPart<T, D, Sort>, usize)>>,
    filter: FetchBatchFilter<T>,
    budget: usize,
    drop_stash: Option<Sort::Updates>,
}

Expand description

A tool for incrementally consolidating a persist shard.

The naive way to consolidate a Persist shard would be to fetch every part, then consolidate the whole thing. We’d like to improve on that in two ways:

- Concurrency: we’d like to be able to start consolidating and returning results before every part is fetched. (And continue fetching while we’re doing other work.)
- Memory usage: we’d like to limit the number of parts we have in memory at once, dropping parts that are fully consolidated and fetching parts just a little before they’re needed.

This interface achieves both goals by consolidating in multiple steps. Each call to `Self::next` will do some housekeeping work – prefetching needed parts, dropping any unneeded parts – and return an iterator over a consolidated subset of the data. To read an entire dataset, the client should call `next` until it returns `None`, which signals that all data has been returned… but it’s also free to abandon the instance at any time if it, e.g., only needs a few entries.

Fields§

§context: String
§shard_id: ShardId
§sort: Sort
§blob: Arc<dyn Blob>
§metrics: Arc<Metrics>
§shard_metrics: Arc<ShardMetrics>
§read_metrics: Arc<ReadMetrics>
§runs: Vec<VecDeque<(ConsolidationPart<T, D, Sort>, usize)>>
§filter: FetchBatchFilter<T>
§budget: usize
§drop_stash: Option<Sort::Updates>

Struct mz_persist_client::iter::Consolidator (Copy item path)

Fields§

Implementations§

impl<T, D, Sort> Consolidator<T, D, Sort> where T: Timestamp + Codec64 + Lattice, D: Codec64 + Semigroup + Ord, Sort: RowSort<T, D>,

pub fn new( context: String, shard_id: ShardId, sort: Sort, blob: Arc<dyn Blob>, metrics: Arc<Metrics>, shard_metrics: Arc<ShardMetrics>, read_metrics: ReadMetrics, filter: FetchBatchFilter<T>, prefetch_budget_bytes: usize, ) -> Self

impl<T, D, Sort> Consolidator<T, D, Sort> where T: Timestamp + Codec64 + Lattice + Sync, D: Codec64 + Semigroup + Ord, Sort: RowSort<T, D>,

pub fn enqueue_run( &mut self, desc: &Description<T>, run_meta: &RunMeta, parts: impl IntoIterator<Item = RunPart<T>>, )

fn push_run(&mut self, run: VecDeque<(ConsolidationPart<T, D, Sort>, usize)>)

fn trim(&mut self)

fn iter(&mut self) -> Option<ConsolidatingIter<'_, T, D, Sort>>

async fn unblock_progress(&mut self) -> Result<()>

pub(crate) async fn next( &mut self, ) -> Result<Option<impl Iterator<Item = (Sort::KV<'_>, T, D)>>>

pub(crate) async fn next_chunk( &mut self, max_len: usize, max_bytes: usize, ) -> Result<Option<BlobTraceUpdates>>

fn live_bytes(&self) -> usize

pub(crate) fn start_prefetches(&mut self) -> Option<usize>

Trait Implementations§

impl<T: Debug, D: Debug, Sort: Debug + RowSort<T, D>> Debug for Consolidator<T, D, Sort> where Sort::Updates: Debug,

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl<T, D, Sort: RowSort<T, D>> Drop for Consolidator<T, D, Sort>

fn drop(&mut self)

Auto Trait Implementations§

impl<T, D, Sort> Freeze for Consolidator<T, D, Sort> where Sort: Freeze, <Sort as RowSort<T, D>>::Updates: Freeze, T: Freeze,

impl<T, D, Sort = CodecSort<T, D>> !RefUnwindSafe for Consolidator<T, D, Sort>

impl<T, D, Sort> Send for Consolidator<T, D, Sort> where Sort: Send, <Sort as RowSort<T, D>>::Updates: Send, T: Send + Sync,

impl<T, D, Sort> Sync for Consolidator<T, D, Sort> where Sort: Sync, <Sort as RowSort<T, D>>::Updates: Sync, T: Sync + Send,

impl<T, D, Sort> Unpin for Consolidator<T, D, Sort> where Sort: Unpin, <Sort as RowSort<T, D>>::Updates: Unpin, T: Unpin,

impl<T, D, Sort = CodecSort<T, D>> !UnwindSafe for Consolidator<T, D, Sort>

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T, U> CastInto<U> for T where U: CastFrom<T>,

fn cast_into(self) -> U

impl<T> CopyAs<T> for T

fn copy_as(self) -> T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> FutureExt for T

fn with_context(self, otel_cx: Context) -> WithContext<Self>

fn with_current_context(self) -> WithContext<Self>

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoRequest<T> for T

fn into_request(self) -> Request<T>

impl<Unshared, Shared> IntoShared<Shared> for Unshared where Shared: FromUnshared<Unshared>,

fn into_shared(self) -> Shared

impl<T> Pointable for T

const ALIGN: usize = _

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<P, R> ProtoType<R> for P where R: RustType<P>,

fn into_rust(self) -> Result<R, TryFromProtoError>

fn from_rust(rust: &R) -> P

impl<T> Same for T

type Output = T

impl<'a, S, T> Semigroup<&'a S> for T where T: Semigroup<S>,

fn plus_equals(&mut self, rhs: &&'a S)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Struct mz_persist_client::iter::Consolidator

impl<T, D, Sort> Consolidator<T, D, Sort>
where T: Timestamp + Codec64 + Lattice, D: Codec64 + Semigroup + Ord, Sort: RowSort<T, D>,

impl<T, D, Sort> Consolidator<T, D, Sort>
where T: Timestamp + Codec64 + Lattice + Sync, D: Codec64 + Semigroup + Ord, Sort: RowSort<T, D>,

impl<T: Debug, D: Debug, Sort: Debug + RowSort<T, D>> Debug for Consolidator<T, D, Sort>
where Sort::Updates: Debug,

impl<T, D, Sort> Freeze for Consolidator<T, D, Sort>
where Sort: Freeze, <Sort as RowSort<T, D>>::Updates: Freeze, T: Freeze,

impl<T, D, Sort> Send for Consolidator<T, D, Sort>
where Sort: Send, <Sort as RowSort<T, D>>::Updates: Send, T: Send + Sync,

impl<T, D, Sort> Sync for Consolidator<T, D, Sort>
where Sort: Sync, <Sort as RowSort<T, D>>::Updates: Sync, T: Sync + Send,

impl<T, D, Sort> Unpin for Consolidator<T, D, Sort>
where Sort: Unpin, <Sort as RowSort<T, D>>::Updates: Unpin, T: Unpin,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> CastInto<U> for T
where U: CastFrom<T>,

impl<T, U> Into<U> for T
where U: From<T>,

impl<Unshared, Shared> IntoShared<Shared> for Unshared
where Shared: FromUnshared<Unshared>,

impl<P, R> ProtoType<R> for P
where R: RustType<P>,

impl<'a, S, T> Semigroup<&'a S> for T
where T: Semigroup<S>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,