// mz_persist_client/internal/restore.rs
use crate::internal::encoding::UntypedState;
use crate::internal::paths::BlobKey;
use crate::internal::state::{BatchPart, RunPart, State};
use crate::internal::state_diff::{StateDiff, StateFieldValDiff};
use crate::internal::state_versions::StateVersions;
use crate::metrics::Metrics;
use crate::ShardId;
use anyhow::anyhow;
use mz_persist::location::Blob;
use timely::Container;
use tracing::info;
/// Walks every live state diff of `shard_id` and calls `blob.restore` on each
/// blob key those diffs reference, collecting the keys whose restore call
/// returned an error.
///
/// Keys visited:
/// - every rollup inserted or updated by a live diff, unless it is keyed
///   before the first live seqno;
/// - for the rollup keyed exactly at the first live seqno (when its restore
///   succeeded): every rollup and every batch part listed in that rollup's
///   decoded state;
/// - every part of every batch inserted or updated by a live diff, expanding
///   `RunPart::Many` references into the parts they contain.
///
/// # Returns
///
/// The keys for which `blob.restore` reported an error. Empty if the shard has
/// no live diffs.
///
/// # Errors
///
/// Fails outright (instead of recording a key) when:
/// - reading the first live rollup back from `blob` errors or yields nothing;
/// - the decoded rollup state does not pass `check_ts_codec`;
/// - a `RunPart::Many` reference cannot be fetched. The fetch is attempted
///   whether or not restoring that run's key succeeded.
pub(crate) async fn restore_blob(
    versions: &StateVersions,
    blob: &dyn Blob,
    build_version: &semver::Version,
    shard_id: ShardId,
    metrics: &Metrics,
) -> anyhow::Result<Vec<BlobKey>> {
    /// Returns the value a field diff leaves behind, or `None` for a deletion.
    fn after<A>(diff: StateFieldValDiff<A>) -> Option<A> {
        match diff {
            StateFieldValDiff::Insert(new) | StateFieldValDiff::Update(_, new) => Some(new),
            StateFieldValDiff::Delete(_) => None,
        }
    }

    let live_diffs = versions.fetch_all_live_diffs(&shard_id).await;
    let first_live_seqno = match live_diffs.0.first() {
        Some(earliest) => earliest.seqno,
        None => {
            info!("No diffs for shard {shard_id}.");
            return Ok(vec![]);
        }
    };

    // Keys whose restore call failed; this is what the caller gets back.
    let mut failed_keys = vec![];
    let mut record_outcome = |key: &BlobKey, outcome: Result<(), _>| {
        if outcome.is_err() {
            failed_keys.push(key.clone());
        }
    };

    for versioned in live_diffs.0 {
        let mut state_diff: StateDiff<u64> = StateDiff::decode(build_version, versioned.data);
        // Work list of parts still to visit for this diff; run references
        // push their contained parts back onto it.
        let mut pending_parts = vec![];

        let rollup_diffs = std::mem::take(&mut state_diff.rollups);
        for rollup_diff in rollup_diffs {
            // Rollups keyed before the first live diff are not restored
            // (presumably nothing live refers to them -- confirm).
            if rollup_diff.key < first_live_seqno {
                continue;
            }
            let rollup = match after(rollup_diff.val) {
                Some(rollup) => rollup,
                None => continue,
            };

            let rollup_key = rollup.key.complete(&shard_id);
            let restore_outcome = blob.restore(&rollup_key).await;
            let restored = restore_outcome.is_ok();
            record_outcome(&rollup_key, restore_outcome);

            // Only the rollup at the first live seqno is opened up, and only
            // if it was restored; a failed restore has already been recorded
            // and we carry on with the remaining keys.
            let is_first_live = rollup_diff.key == first_live_seqno;
            if !is_first_live || !restored {
                continue;
            }

            let Some(rollup_bytes) = blob.get(&rollup_key).await? else {
                return Err(anyhow!("fetching just-restored rollup"));
            };
            let rollup_state: State<u64> =
                UntypedState::decode(build_version, rollup_bytes).check_ts_codec(&shard_id)?;

            // Restore the rollups that the first live rollup itself lists.
            for (listed_seqno, listed_rollup) in &rollup_state.collections.rollups {
                if *listed_seqno < first_live_seqno {
                    continue;
                }
                let listed_key = listed_rollup.key.complete(&shard_id);
                let outcome = blob.restore(&listed_key).await;
                record_outcome(&listed_key, outcome);
            }

            // Queue every part of every batch in the rollup's trace.
            for batch in rollup_state.collections.trace.batches() {
                pending_parts.extend(batch.parts.iter().cloned());
            }
        }

        // Queue the parts of each batch this diff inserts or updates.
        for batch_diff in state_diff.referenced_batches() {
            let Some(batch) = after(batch_diff) else {
                continue;
            };
            pending_parts.extend(batch.parts.iter().cloned());
        }

        while let Some(next_part) = pending_parts.pop() {
            match next_part {
                RunPart::Single(single) => match single {
                    // Inline parts have no blob key to restore.
                    BatchPart::Inline { .. } => {}
                    BatchPart::Hollow(hollow) => {
                        let part_key = hollow.key.complete(&shard_id);
                        let outcome = blob.restore(&part_key).await;
                        record_outcome(&part_key, outcome);
                    }
                },
                RunPart::Many(run_ref) => {
                    let run_key = run_ref.key.complete(&shard_id);
                    let outcome = blob.restore(&run_key).await;
                    record_outcome(&run_key, outcome);

                    // The run must be readable to discover the parts it
                    // contains; failing to fetch it aborts the whole restore.
                    let Some(fetched_run) = run_ref.get(shard_id, blob, metrics).await else {
                        return Err(anyhow!("fetching just-restored run"));
                    };
                    pending_parts.extend(fetched_run.parts);
                }
            }
        }
    }

    Ok(failed_keys)
}