1use itertools::Itertools;
34use proptest_derive::Arbitrary;
35use serde::{Deserialize, Serialize};
36use std::borrow::Cow;
37use std::collections::{BTreeMap, BTreeSet};
38use std::fmt;
39use std::fmt::{Display, Formatter};
40
41use mz_ore::stack::RecursionLimitError;
42use mz_ore::str::{Indent, bracketed, separated};
43
44use crate::explain::dot::{DisplayDot, dot_string};
45use crate::explain::json::{DisplayJson, json_string};
46use crate::explain::text::{DisplayText, text_string};
47use crate::optimize::OptimizerFeatureOverrides;
48use crate::{GlobalId, ReprColumnType, ReprScalarType, SqlColumnType, SqlScalarType};
49
50pub mod dot;
51pub mod json;
52pub mod text;
53#[cfg(feature = "tracing")]
54pub mod tracing;
55
56#[cfg(feature = "tracing")]
57pub use crate::explain::tracing::trace_plan;
58
/// The output formats in which an explanation can be requested.
///
/// [`Explain::explain`] dispatches on this value to the matching
/// `explain_*` method.
#[derive(Debug, Clone, Copy, Eq, PartialEq)]
pub enum ExplainFormat {
    /// Text output; displayed as `TEXT`.
    Text,
    /// JSON output; displayed as `JSON`.
    Json,
    /// DOT output; displayed as `DOT`.
    Dot,
}
66
67impl fmt::Display for ExplainFormat {
68 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
69 match self {
70 ExplainFormat::Text => f.write_str("TEXT"),
71 ExplainFormat::Json => f.write_str("JSON"),
72 ExplainFormat::Dot => f.write_str("DOT"),
73 }
74 }
75}
76
/// An enum without variants, so no value of this type can ever be
/// constructed.
///
/// The tests in this file use it as the `Json` and `Dot` associated types of
/// an [`Explain`] implementation that only provides text output.
#[allow(missing_debug_implementations)]
pub enum UnsupportedFormat {}
82
/// Errors that can occur while producing explain output.
///
/// The `Display` implementation prefixes every variant with
/// `error while rendering explain output: `.
#[derive(Debug)]
pub enum ExplainError {
    /// The requested format is not supported; this is what the default
    /// `explain_*` methods of [`Explain`] return.
    UnsupportedFormat(ExplainFormat),
    /// A wrapped [`fmt::Error`].
    FormatError(fmt::Error),
    /// A wrapped [`anyhow::Error`].
    AnyhowError(anyhow::Error),
    /// A wrapped [`RecursionLimitError`].
    RecursionLimitError(RecursionLimitError),
    /// A wrapped [`serde_json::Error`].
    SerdeJsonError(serde_json::Error),
    /// The `linear_chains` option was combined with
    /// `WITH MUTUALLY RECURSIVE`, which is not supported.
    LinearChainsPlusRecursive,
    /// Any other failure, carried as a plain message.
    UnknownError(String),
}
95
96impl fmt::Display for ExplainError {
97 fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
98 write!(f, "error while rendering explain output: ")?;
99 match self {
100 ExplainError::UnsupportedFormat(format) => {
101 write!(f, "{} format is not supported", format)
102 }
103 ExplainError::FormatError(error) => {
104 write!(f, "{}", error)
105 }
106 ExplainError::AnyhowError(error) => {
107 write!(f, "{}", error)
108 }
109 ExplainError::RecursionLimitError(error) => {
110 write!(f, "{}", error)
111 }
112 ExplainError::SerdeJsonError(error) => {
113 write!(f, "{}", error)
114 }
115 ExplainError::LinearChainsPlusRecursive => {
116 write!(
117 f,
118 "The linear_chains option is not supported with WITH MUTUALLY RECURSIVE."
119 )
120 }
121 ExplainError::UnknownError(error) => {
122 write!(f, "{}", error)
123 }
124 }
125 }
126}
127
128impl From<fmt::Error> for ExplainError {
129 fn from(error: fmt::Error) -> Self {
130 ExplainError::FormatError(error)
131 }
132}
133
134impl From<anyhow::Error> for ExplainError {
135 fn from(error: anyhow::Error) -> Self {
136 ExplainError::AnyhowError(error)
137 }
138}
139
140impl From<RecursionLimitError> for ExplainError {
141 fn from(error: RecursionLimitError) -> Self {
142 ExplainError::RecursionLimitError(error)
143 }
144}
145
146impl From<serde_json::Error> for ExplainError {
147 fn from(error: serde_json::Error) -> Self {
148 ExplainError::SerdeJsonError(error)
149 }
150}
151
/// Flags that configure how an explanation is produced and rendered.
///
/// The first eight flags (`subtree_size` through `equivalences`) select which
/// entries of [`Analyses`] are printed by [`HumanizedAnalyses`]; if any of
/// them is set, [`ExplainConfig::requires_analyses`] returns `true`.
///
/// NOTE(review): the remaining flags are not read anywhere in this file, so
/// their descriptions below are inferred from their names only.
#[derive(Clone, Debug)]
pub struct ExplainConfig {
    /// Print the `subtree_size` analysis.
    pub subtree_size: bool,
    /// Print the `arity` analysis.
    pub arity: bool,
    /// Print the `types` analysis.
    pub types: bool,
    /// Print the `keys` analysis.
    pub keys: bool,
    /// Print the `non_negative` analysis.
    pub non_negative: bool,
    /// Print the `cardinality` analysis.
    pub cardinality: bool,
    /// Print the `column_names` analysis.
    pub column_names: bool,
    /// Print the `equivalences` analysis (rendered under the name `equivs`).
    pub equivalences: bool,
    /// Presumably: show join implementations. Defaults to `true`.
    pub join_impls: bool,
    /// Presumably: render expressions in humanized form.
    pub humanized_exprs: bool,
    /// The `linear_chains` option. [`ExplainError::LinearChainsPlusRecursive`]
    /// reports that it is not supported with `WITH MUTUALLY RECURSIVE`.
    pub linear_chains: bool,
    /// Presumably: disable fast-path plans. Defaults to `true`.
    pub no_fast_path: bool,
    /// Presumably: suppress notices.
    pub no_notices: bool,
    /// Presumably: show node IDs.
    pub node_ids: bool,
    /// Presumably: show raw plans. Defaults to `true`.
    pub raw_plans: bool,
    /// Presumably: use the raw output syntax.
    pub raw_syntax: bool,
    /// Presumably: use the verbose output syntax.
    pub verbose_syntax: bool,
    /// Presumably: redact values in the output. Defaults to the negation of
    /// `mz_ore::assert::soft_assertions_enabled()`.
    pub redacted: bool,
    /// Presumably: include timing information. The test explanation in this
    /// file prints its frontier interval only when this flag is set.
    pub timing: bool,
    /// Presumably: show filter pushdown information.
    pub filter_pushdown: bool,

    /// Optimizer feature overrides carried along with the flags.
    pub features: OptimizerFeatureOverrides,
}
206
207impl Default for ExplainConfig {
208 fn default() -> Self {
209 Self {
210 redacted: !mz_ore::assert::soft_assertions_enabled(),
212 arity: false,
213 cardinality: false,
214 column_names: false,
215 filter_pushdown: false,
216 humanized_exprs: false,
217 join_impls: true,
218 keys: false,
219 linear_chains: false,
220 no_fast_path: true,
221 no_notices: false,
222 node_ids: false,
223 non_negative: false,
224 raw_plans: true,
225 raw_syntax: false,
226 verbose_syntax: false,
227 subtree_size: false,
228 timing: false,
229 types: false,
230 equivalences: false,
231 features: Default::default(),
232 }
233 }
234}
235
236impl ExplainConfig {
237 pub fn requires_analyses(&self) -> bool {
238 self.subtree_size
239 || self.non_negative
240 || self.arity
241 || self.types
242 || self.keys
243 || self.cardinality
244 || self.column_names
245 || self.equivalences
246 }
247}
248
/// The kind of object an explanation refers to.
///
/// NOTE(review): the variants are not used in this file; the descriptions
/// below are inferred from their names.
#[derive(Clone, Debug)]
pub enum Explainee {
    /// Presumably a materialized view, identified by its [`GlobalId`].
    MaterializedView(GlobalId),
    /// Presumably an index, identified by its [`GlobalId`].
    Index(GlobalId),
    /// Presumably a dataflow, identified by a [`GlobalId`].
    Dataflow(GlobalId),
    /// Presumably a `SELECT` query; carries no identifier.
    Select,
}
264
265pub trait Explain<'a>: 'a {
271 type Context;
274
275 type Text: DisplayText;
278
279 type Json: DisplayJson;
282
283 type Dot: DisplayDot;
286
287 fn explain(
302 &'a mut self,
303 format: &'a ExplainFormat,
304 context: &'a Self::Context,
305 ) -> Result<String, ExplainError> {
306 match format {
307 ExplainFormat::Text => self.explain_text(context).map(|e| text_string(&e)),
308 ExplainFormat::Json => self.explain_json(context).map(|e| json_string(&e)),
309 ExplainFormat::Dot => self.explain_dot(context).map(|e| dot_string(&e)),
310 }
311 }
312
313 #[allow(unused_variables)]
325 fn explain_text(&'a mut self, context: &'a Self::Context) -> Result<Self::Text, ExplainError> {
326 Err(ExplainError::UnsupportedFormat(ExplainFormat::Text))
327 }
328
329 #[allow(unused_variables)]
341 fn explain_json(&'a mut self, context: &'a Self::Context) -> Result<Self::Json, ExplainError> {
342 Err(ExplainError::UnsupportedFormat(ExplainFormat::Json))
343 }
344
345 #[allow(unused_variables)]
357 fn explain_dot(&'a mut self, context: &'a Self::Context) -> Result<Self::Dot, ExplainError> {
358 Err(ExplainError::UnsupportedFormat(ExplainFormat::Dot))
359 }
360}
361
362#[derive(Debug)]
366pub struct RenderingContext<'a> {
367 pub indent: Indent,
368 pub humanizer: &'a dyn ExprHumanizer,
369}
370
371impl<'a> RenderingContext<'a> {
372 pub fn new(indent: Indent, humanizer: &'a dyn ExprHumanizer) -> RenderingContext<'a> {
373 RenderingContext { indent, humanizer }
374 }
375}
376
377impl<'a> AsMut<Indent> for RenderingContext<'a> {
378 fn as_mut(&mut self) -> &mut Indent {
379 &mut self.indent
380 }
381}
382
383impl<'a> AsRef<&'a dyn ExprHumanizer> for RenderingContext<'a> {
384 fn as_ref(&self) -> &&'a dyn ExprHumanizer {
385 &self.humanizer
386 }
387}
388
389#[allow(missing_debug_implementations)]
390pub struct PlanRenderingContext<'a, T> {
391 pub indent: Indent,
392 pub humanizer: &'a dyn ExprHumanizer,
393 pub annotations: BTreeMap<&'a T, Analyses>,
394 pub config: &'a ExplainConfig,
395}
396
397impl<'a, T> PlanRenderingContext<'a, T> {
398 pub fn new(
399 indent: Indent,
400 humanizer: &'a dyn ExprHumanizer,
401 annotations: BTreeMap<&'a T, Analyses>,
402 config: &'a ExplainConfig,
403 ) -> PlanRenderingContext<'a, T> {
404 PlanRenderingContext {
405 indent,
406 humanizer,
407 annotations,
408 config,
409 }
410 }
411}
412
413impl<'a, T> AsMut<Indent> for PlanRenderingContext<'a, T> {
414 fn as_mut(&mut self) -> &mut Indent {
415 &mut self.indent
416 }
417}
418
419impl<'a, T> AsRef<&'a dyn ExprHumanizer> for PlanRenderingContext<'a, T> {
420 fn as_ref(&self) -> &&'a dyn ExprHumanizer {
421 &self.humanizer
422 }
423}
424
425pub trait ExprHumanizer: fmt::Debug {
430 fn humanize_id(&self, id: GlobalId) -> Option<String>;
433
434 fn humanize_id_unqualified(&self, id: GlobalId) -> Option<String>;
436
437 fn humanize_id_parts(&self, id: GlobalId) -> Option<Vec<String>>;
440
441 fn humanize_scalar_type(&self, ty: &SqlScalarType, postgres_compat: bool) -> String;
446
447 fn humanize_scalar_type_repr(&self, typ: &ReprScalarType, postgres_compat: bool) -> String {
450 self.humanize_scalar_type(&SqlScalarType::from_repr(typ), postgres_compat)
451 }
452
453 fn humanize_column_type(&self, typ: &SqlColumnType, postgres_compat: bool) -> String {
458 format!(
459 "{}{}",
460 self.humanize_scalar_type(&typ.scalar_type, postgres_compat),
461 if typ.nullable { "?" } else { "" }
462 )
463 }
464
465 fn humanize_column_type_repr(&self, typ: &ReprColumnType, postgres_compat: bool) -> String {
468 self.humanize_column_type(&SqlColumnType::from_repr(typ), postgres_compat)
469 }
470
471 fn column_names_for_id(&self, id: GlobalId) -> Option<Vec<String>>;
473
474 fn humanize_column(&self, id: GlobalId, column: usize) -> Option<String>;
476
477 fn id_exists(&self, id: GlobalId) -> bool;
479}
480
481#[derive(Debug)]
484pub struct ExprHumanizerExt<'a> {
485 items: BTreeMap<GlobalId, TransientItem>,
488 inner: &'a dyn ExprHumanizer,
491}
492
493impl<'a> ExprHumanizerExt<'a> {
494 pub fn new(items: BTreeMap<GlobalId, TransientItem>, inner: &'a dyn ExprHumanizer) -> Self {
495 Self { items, inner }
496 }
497}
498
499impl<'a> ExprHumanizer for ExprHumanizerExt<'a> {
500 fn humanize_id(&self, id: GlobalId) -> Option<String> {
501 match self.items.get(&id) {
502 Some(item) => item
503 .humanized_id_parts
504 .as_ref()
505 .map(|parts| parts.join(".")),
506 None => self.inner.humanize_id(id),
507 }
508 }
509
510 fn humanize_id_unqualified(&self, id: GlobalId) -> Option<String> {
511 match self.items.get(&id) {
512 Some(item) => item
513 .humanized_id_parts
514 .as_ref()
515 .and_then(|parts| parts.last().cloned()),
516 None => self.inner.humanize_id_unqualified(id),
517 }
518 }
519
520 fn humanize_id_parts(&self, id: GlobalId) -> Option<Vec<String>> {
521 match self.items.get(&id) {
522 Some(item) => item.humanized_id_parts.clone(),
523 None => self.inner.humanize_id_parts(id),
524 }
525 }
526
527 fn humanize_scalar_type(&self, ty: &SqlScalarType, postgres_compat: bool) -> String {
528 self.inner.humanize_scalar_type(ty, postgres_compat)
529 }
530
531 fn column_names_for_id(&self, id: GlobalId) -> Option<Vec<String>> {
532 match self.items.get(&id) {
533 Some(item) => item.column_names.clone(),
534 None => self.inner.column_names_for_id(id),
535 }
536 }
537
538 fn humanize_column(&self, id: GlobalId, column: usize) -> Option<String> {
539 match self.items.get(&id) {
540 Some(item) => match &item.column_names {
541 Some(column_names) => Some(column_names[column].clone()),
542 None => None,
543 },
544 None => self.inner.humanize_column(id, column),
545 }
546 }
547
548 fn id_exists(&self, id: GlobalId) -> bool {
549 self.items.contains_key(&id) || self.inner.id_exists(id)
550 }
551}
552
/// Name and column information for an item that [`ExprHumanizerExt`] can
/// resolve on its own, without asking the humanizer it wraps.
#[derive(Debug)]
pub struct TransientItem {
    /// The parts of the item's name, if known. [`ExprHumanizerExt`] joins
    /// them with `.` for the full name and uses the last part as the
    /// unqualified name.
    humanized_id_parts: Option<Vec<String>>,
    /// The item's column names, if known.
    column_names: Option<Vec<String>>,
}

impl TransientItem {
    /// Creates an item from its optional name parts and optional column
    /// names.
    pub fn new(humanized_id_parts: Option<Vec<String>>, column_names: Option<Vec<String>>) -> Self {
        Self {
            humanized_id_parts,
            column_names,
        }
    }
}
570
571#[derive(Debug)]
577pub struct DummyHumanizer;
578
579impl ExprHumanizer for DummyHumanizer {
580 fn humanize_id(&self, _: GlobalId) -> Option<String> {
581 None
584 }
585
586 fn humanize_id_unqualified(&self, _id: GlobalId) -> Option<String> {
587 None
588 }
589
590 fn humanize_id_parts(&self, _id: GlobalId) -> Option<Vec<String>> {
591 None
592 }
593
594 fn humanize_scalar_type(&self, ty: &SqlScalarType, _postgres_compat: bool) -> String {
595 format!("{:?}", ty)
597 }
598
599 fn column_names_for_id(&self, _id: GlobalId) -> Option<Vec<String>> {
600 None
601 }
602
603 fn humanize_column(&self, _id: GlobalId, _column: usize) -> Option<String> {
604 None
605 }
606
607 fn id_exists(&self, _id: GlobalId) -> bool {
608 false
609 }
610}
611
/// A borrowed slice of `usize` indices.
///
/// NOTE(review): presumably a wrapper for formatting index lists; no
/// formatting implementation is defined in this file.
#[derive(Debug)]
pub struct Indices<'a>(pub &'a [usize]);
615
/// A borrowed slice of scalars implementing [`ScalarOps`].
///
/// NOTE(review): presumably a wrapper for rendering scalar sequences
/// compactly; no formatting implementation is defined in this file.
#[derive(Debug)]
pub struct CompactScalarSeq<'a, T: ScalarOps>(pub &'a [T]);

/// A cloneable iterator over scalars implementing [`ScalarOps`].
///
/// NOTE(review): presumably the iterator-based counterpart of
/// [`CompactScalarSeq`]; no formatting implementation is defined in this
/// file.
#[derive(Debug)]
pub struct CompactScalars<T, I>(pub I)
where
    T: ScalarOps,
    I: Iterator<Item = T> + Clone;
632
/// Operations that the element types of [`CompactScalarSeq`] and
/// [`CompactScalars`] must provide.
pub trait ScalarOps {
    /// NOTE(review): presumably returns `Some(index)` when the scalar is a
    /// plain column reference and `None` otherwise; confirm against the
    /// implementors.
    fn match_col_ref(&self) -> Option<usize>;

    /// NOTE(review): presumably reports whether the scalar refers to column
    /// `col_ref`; confirm against the implementors.
    fn references(&self, col_ref: usize) -> bool;
}
638
/// A borrowed plan together with [`Analyses`] for its nodes.
#[allow(missing_debug_implementations)]
pub struct AnnotatedPlan<'a, T> {
    /// The plan being annotated.
    pub plan: &'a T,
    /// Analyses keyed by a reference to the node they belong to.
    pub annotations: BTreeMap<&'a T, Analyses>,
}
646
/// Analysis results attached to a plan node.
///
/// Every field is optional and defaults to `None`. [`HumanizedAnalyses`]
/// prints a field only when the flag of the same name is set in
/// [`ExplainConfig`], and panics if that field is `None` at that point.
#[derive(Clone, Default, Debug)]
pub struct Analyses {
    /// The `non_negative` analysis result.
    pub non_negative: Option<bool>,
    /// The `subtree_size` analysis result.
    pub subtree_size: Option<usize>,
    /// The `arity` analysis result.
    pub arity: Option<usize>,
    /// The column types. An inner `None` is rendered as `(<error>)`.
    pub types: Option<Option<Vec<SqlColumnType>>>,
    /// The keys, each given as a list of `usize` values (presumably column
    /// indices).
    pub keys: Option<Vec<Vec<usize>>>,
    /// The cardinality, already rendered as text.
    pub cardinality: Option<String>,
    /// The column names. An empty name is rendered as `#` followed by the
    /// column's position.
    pub column_names: Option<Vec<String>>,
    /// The equivalences, already rendered as text.
    pub equivalences: Option<String>,
}
659
660#[derive(Debug, Clone)]
661pub struct HumanizedAnalyses<'a> {
662 analyses: &'a Analyses,
663 humanizer: &'a dyn ExprHumanizer,
664 config: &'a ExplainConfig,
665}
666
667impl<'a> HumanizedAnalyses<'a> {
668 pub fn new<T>(analyses: &'a Analyses, ctx: &PlanRenderingContext<'a, T>) -> Self {
669 Self {
670 analyses,
671 humanizer: ctx.humanizer,
672 config: ctx.config,
673 }
674 }
675}
676
677impl<'a> Display for HumanizedAnalyses<'a> {
678 fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
683 let mut builder = f.debug_struct("//");
684
685 if self.config.subtree_size {
686 let subtree_size = self.analyses.subtree_size.expect("subtree_size");
687 builder.field("subtree_size", &subtree_size);
688 }
689
690 if self.config.non_negative {
691 let non_negative = self.analyses.non_negative.expect("non_negative");
692 builder.field("non_negative", &non_negative);
693 }
694
695 if self.config.arity {
696 let arity = self.analyses.arity.expect("arity");
697 builder.field("arity", &arity);
698 }
699
700 if self.config.types {
701 let types = match self.analyses.types.as_ref().expect("types") {
702 Some(types) => {
703 let types = types
704 .into_iter()
705 .map(|c| self.humanizer.humanize_column_type(c, false))
706 .collect::<Vec<_>>();
707
708 bracketed("(", ")", separated(", ", types)).to_string()
709 }
710 None => "(<error>)".to_string(),
711 };
712 builder.field("types", &types);
713 }
714
715 if self.config.keys {
716 let keys = self
717 .analyses
718 .keys
719 .as_ref()
720 .expect("keys")
721 .into_iter()
722 .map(|key| bracketed("[", "]", separated(", ", key)).to_string());
723 let keys = bracketed("(", ")", separated(", ", keys)).to_string();
724 builder.field("keys", &keys);
725 }
726
727 if self.config.cardinality {
728 let cardinality = self.analyses.cardinality.as_ref().expect("cardinality");
729 builder.field("cardinality", cardinality);
730 }
731
732 if self.config.column_names {
733 let column_names = self.analyses.column_names.as_ref().expect("column_names");
734 let column_names = column_names.into_iter().enumerate().map(|(i, c)| {
735 if c.is_empty() {
736 Cow::Owned(format!("#{i}"))
737 } else {
738 Cow::Borrowed(c)
739 }
740 });
741 let column_names = bracketed("(", ")", separated(", ", column_names)).to_string();
742 builder.field("column_names", &column_names);
743 }
744
745 if self.config.equivalences {
746 let equivs = self.analyses.equivalences.as_ref().expect("equivalences");
747 builder.field("equivs", equivs);
748 }
749
750 builder.finish()
751 }
752}
753
754#[derive(Clone, Debug, Default)]
763pub struct UsedIndexes(BTreeSet<(GlobalId, Vec<IndexUsageType>)>);
764
765impl UsedIndexes {
766 pub fn new(values: BTreeSet<(GlobalId, Vec<IndexUsageType>)>) -> UsedIndexes {
767 UsedIndexes(values)
768 }
769
770 pub fn is_empty(&self) -> bool {
771 self.0.is_empty()
772 }
773}
774
/// The ways in which an index can be used.
///
/// The quoted text on each variant is what its `Display` implementation
/// prints.
#[derive(Debug, Clone, Arbitrary, Serialize, Deserialize, Eq, PartialEq, Ord, PartialOrd, Hash)]
pub enum IndexUsageType {
    /// Displayed as `*** full scan ***`.
    FullScan,
    /// Displayed as `differential join`.
    DifferentialJoin,
    /// Use in a delta join; the payload selects the displayed text.
    DeltaJoin(DeltaJoinIndexUsageType),
    /// Displayed as `lookup`; the carried [`GlobalId`] is not printed.
    Lookup(GlobalId),
    /// Displayed as `plan root (no new arrangement)`.
    PlanRootNoArrangement,
    /// Displayed as `sink export`.
    SinkExport,
    /// Displayed as `index export`.
    IndexExport,
    /// Displayed as `fast path limit`.
    FastPathLimit,
    /// Displayed as `*** INTERNAL ERROR (dangling ArrangeBy) ***`.
    DanglingArrangeBy,
    /// Displayed as `*** INTERNAL ERROR (unknown usage) ***`.
    Unknown,
}
815
/// The payload of [`IndexUsageType::DeltaJoin`].
///
/// The quoted text on each variant is what `IndexUsageType`'s `Display`
/// implementation prints for it.
#[derive(Debug, Clone, Arbitrary, Serialize, Deserialize, Eq, PartialEq, Ord, PartialOrd, Hash)]
pub enum DeltaJoinIndexUsageType {
    /// Displayed as `*** INTERNAL ERROR (unknown delta join usage) ***`.
    Unknown,
    /// Displayed as `delta join lookup`.
    Lookup,
    /// Displayed as `delta join 1st input (full scan)`.
    FirstInputFullScan,
}
825
826impl std::fmt::Display for IndexUsageType {
827 fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
828 write!(
829 f,
830 "{}",
831 match self {
832 IndexUsageType::FullScan => "*** full scan ***",
833 IndexUsageType::Lookup(_idx_id) => "lookup",
834 IndexUsageType::DifferentialJoin => "differential join",
835 IndexUsageType::DeltaJoin(DeltaJoinIndexUsageType::FirstInputFullScan) =>
836 "delta join 1st input (full scan)",
837 IndexUsageType::DeltaJoin(DeltaJoinIndexUsageType::Lookup) => "delta join lookup",
844 IndexUsageType::DeltaJoin(DeltaJoinIndexUsageType::Unknown) =>
845 "*** INTERNAL ERROR (unknown delta join usage) ***",
846 IndexUsageType::PlanRootNoArrangement => "plan root (no new arrangement)",
847 IndexUsageType::SinkExport => "sink export",
848 IndexUsageType::IndexExport => "index export",
849 IndexUsageType::FastPathLimit => "fast path limit",
850 IndexUsageType::DanglingArrangeBy => "*** INTERNAL ERROR (dangling ArrangeBy) ***",
851 IndexUsageType::Unknown => "*** INTERNAL ERROR (unknown usage) ***",
852 }
853 )
854 }
855}
856
857impl IndexUsageType {
858 pub fn display_vec<'a, I>(usage_types: I) -> impl Display + Sized + 'a
859 where
860 I: IntoIterator<Item = &'a IndexUsageType>,
861 {
862 separated(", ", usage_types.into_iter().sorted().dedup())
863 }
864}
865
/// Exercises the [`Explain`] trait end to end with a minimal implementor
/// whose context holds a mutable borrow.
#[cfg(test)]
mod tests {
    use mz_ore::assert_ok;

    use super::*;

    /// Stand-in for external state referenced by the explain context.
    struct Environment {
        name: String,
    }

    impl Default for Environment {
        fn default() -> Self {
            Environment {
                name: "test env".to_string(),
            }
        }
    }

    /// A `[since, upper)` pair printed when `timing` is enabled.
    struct Frontiers<T> {
        since: T,
        upper: T,
    }

    impl<T> Frontiers<T> {
        fn new(since: T, upper: T) -> Self {
            Self { since, upper }
        }
    }

    /// The `Explain::Context` used by the test; note that it holds a
    /// *mutable* borrow of the environment.
    struct ExplainContext<'a> {
        env: &'a mut Environment,
        config: &'a ExplainConfig,
        frontiers: Frontiers<u64>,
    }

    /// The expression being explained: `lhs + rhs`.
    struct TestExpr {
        lhs: i32,
        rhs: i32,
    }

    /// The text explanation: borrows both the expression and the context.
    struct TestExplanation<'a> {
        expr: &'a TestExpr,
        context: &'a ExplainContext<'a>,
    }

    impl<'a> DisplayText for TestExplanation<'a> {
        /// Writes the expression, optionally the frontier interval, and the
        /// environment name, one per line.
        fn fmt_text(&self, f: &mut fmt::Formatter<'_>, _ctx: &mut ()) -> fmt::Result {
            let lhs = &self.expr.lhs;
            let rhs = &self.expr.rhs;
            writeln!(f, "expr = {lhs} + {rhs}")?;

            // The interval line is only printed when timing is requested.
            if self.context.config.timing {
                let since = &self.context.frontiers.since;
                let upper = &self.context.frontiers.upper;
                writeln!(f, "at t ∊ [{since}, {upper})")?;
            }

            let name = &self.context.env.name;
            writeln!(f, "env = {name}")?;

            Ok(())
        }
    }

    /// Only the text format is implemented; JSON and DOT keep the default
    /// "unsupported" behavior.
    impl<'a> Explain<'a> for TestExpr {
        type Context = ExplainContext<'a>;
        type Text = TestExplanation<'a>;
        type Json = UnsupportedFormat;
        type Dot = UnsupportedFormat;

        fn explain_text(
            &'a mut self,
            context: &'a Self::Context,
        ) -> Result<Self::Text, ExplainError> {
            Ok(TestExplanation {
                expr: self,
                context,
            })
        }
    }

    /// Explains the fixed expression `1 + 2` as text with `timing` and
    /// `verbose_syntax` enabled and every other flag disabled.
    fn do_explain(
        env: &mut Environment,
        frontiers: Frontiers<u64>,
    ) -> Result<String, ExplainError> {
        let mut expr = TestExpr { lhs: 1, rhs: 2 };

        let format = ExplainFormat::Text;
        let config = &ExplainConfig {
            redacted: false,
            arity: false,
            cardinality: false,
            column_names: false,
            filter_pushdown: false,
            humanized_exprs: false,
            join_impls: false,
            keys: false,
            linear_chains: false,
            no_fast_path: false,
            no_notices: false,
            node_ids: false,
            non_negative: false,
            raw_plans: false,
            raw_syntax: false,
            verbose_syntax: true,
            subtree_size: false,
            equivalences: false,
            timing: true,
            types: false,
            features: Default::default(),
        };
        let context = ExplainContext {
            env,
            config,
            frontiers,
        };

        expr.explain(&format, &context)
    }

    /// The rendered text contains the expression, the frontier interval and
    /// the environment name.
    #[mz_ore::test]
    fn test_mutable_context() {
        let mut env = Environment::default();
        let frontiers = Frontiers::<u64>::new(3, 7);

        let act = do_explain(&mut env, frontiers);
        let exp = "expr = 1 + 2\nat t ∊ [3, 7)\nenv = test env\n".to_string();

        assert_ok!(act);
        assert_eq!(act.unwrap(), exp);
    }
}