use std::any::Any;
use std::sync::Arc;
use crate::{
error::{DataFusionError, Result},
logical_expr::StringifiedPlan,
physical_plan::{
common::SizedRecordBatchStream, DisplayFormatType, ExecutionPlan, Partitioning,
Statistics,
},
};
use arrow::{array::StringBuilder, datatypes::SchemaRef, record_batch::RecordBatch};
use log::debug;
use super::{expressions::PhysicalSortExpr, SendableRecordBatchStream};
use crate::execution::context::TaskContext;
use crate::physical_plan::metrics::{ExecutionPlanMetricsSet, MemTrackingMetrics};
/// Physical operator backing `EXPLAIN`.
///
/// It holds a set of already-stringified plans and, when executed, emits
/// them as a single record batch (one row per plan that is displayed).
#[derive(Clone, Debug)]
pub struct ExplainExec {
    /// Schema of the record batch produced by `execute`.
    schema: SchemaRef,
    /// The plans, already rendered to text, that this operator reports.
    stringified_plans: Vec<StringifiedPlan>,
    /// Flag forwarded to `StringifiedPlan::should_display` to decide which
    /// plans are included in the output.
    verbose: bool,
}
impl ExplainExec {
pub fn new(
schema: SchemaRef,
stringified_plans: Vec<StringifiedPlan>,
verbose: bool,
) -> Self {
ExplainExec {
schema,
stringified_plans,
verbose,
}
}
pub fn stringified_plans(&self) -> &[StringifiedPlan] {
&self.stringified_plans
}
pub fn verbose(&self) -> bool {
self.verbose
}
}
impl ExecutionPlan for ExplainExec {
    /// Exposes `self` as `Any` so callers can downcast to `ExplainExec`.
    fn as_any(&self) -> &dyn Any {
        self
    }

    /// Returns a shared handle to the output schema.
    fn schema(&self) -> SchemaRef {
        Arc::clone(&self.schema)
    }

    /// This operator is a leaf: it has no child plans.
    fn children(&self) -> Vec<Arc<dyn ExecutionPlan>> {
        Vec::new()
    }

    /// Reports a single output partition with unknown partitioning.
    fn output_partitioning(&self) -> Partitioning {
        Partitioning::UnknownPartitioning(1)
    }

    /// No output ordering is reported.
    fn output_ordering(&self) -> Option<&[PhysicalSortExpr]> {
        None
    }

    /// Returns `self` unchanged; the supplied children are ignored.
    fn with_new_children(
        self: Arc<Self>,
        _children: Vec<Arc<dyn ExecutionPlan>>,
    ) -> Result<Arc<dyn ExecutionPlan>> {
        Ok(self)
    }

    /// Produces a stream containing one record batch with two string columns:
    /// the plan type and the plan text, one row per displayed plan.
    ///
    /// # Errors
    ///
    /// Returns `DataFusionError::Internal` when `partition` is not `0`, and
    /// propagates any error from `RecordBatch::try_new`.
    fn execute(
        &self,
        partition: usize,
        context: Arc<TaskContext>,
    ) -> Result<SendableRecordBatchStream> {
        debug!("Start ExplainExec::execute for partition {} of context session_id {} and task_id {:?}", partition, context.session_id(), context.task_id());

        // Only partition 0 exists (see `output_partitioning`).
        if partition != 0 {
            let message = format!("ExplainExec invalid partition {partition}");
            return Err(DataFusionError::Internal(message));
        }

        let row_capacity = self.stringified_plans.len();
        let mut plan_types = StringBuilder::with_capacity(row_capacity, 1024);
        let mut plan_texts = StringBuilder::with_capacity(row_capacity, 1024);

        // Tracks the most recently emitted plan so that an unchanged plan
        // text can be replaced by a short marker instead of being repeated.
        let mut last_emitted: Option<&StringifiedPlan> = None;
        for current in &self.stringified_plans {
            if !current.should_display(self.verbose) {
                continue;
            }

            plan_types.append_value(current.plan_type.to_string());

            let repeats_previous =
                matches!(last_emitted, Some(earlier) if !should_show(earlier, current));
            if repeats_previous {
                plan_texts.append_value("SAME TEXT AS ABOVE");
            } else {
                plan_texts.append_value(&*current.plan);
            }

            last_emitted = Some(current);
        }

        let batch = RecordBatch::try_new(
            Arc::clone(&self.schema),
            vec![
                Arc::new(plan_types.finish()),
                Arc::new(plan_texts.finish()),
            ],
        )?;

        let metrics_set = ExecutionPlanMetricsSet::new();
        let mem_metrics =
            MemTrackingMetrics::new(&metrics_set, context.memory_pool(), partition);

        debug!(
            "Before returning SizedRecordBatch in ExplainExec::execute for partition {} of context session_id {} and task_id {:?}", partition, context.session_id(), context.task_id());

        let stream = SizedRecordBatchStream::new(
            Arc::clone(&self.schema),
            vec![Arc::new(batch)],
            mem_metrics,
        );
        Ok(Box::pin(stream))
    }

    /// Writes the operator name, `ExplainExec`, to the formatter.
    fn fmt_as(
        &self,
        t: DisplayFormatType,
        f: &mut std::fmt::Formatter,
    ) -> std::fmt::Result {
        match t {
            DisplayFormatType::Default => f.write_str("ExplainExec"),
        }
    }

    /// Returns default (empty) statistics.
    fn statistics(&self) -> Statistics {
        Default::default()
    }
}
/// Decides whether the text of `this_plan` should be printed in full, given
/// the plan that was emitted immediately before it.
///
/// Returns `true` when the two plan texts differ, or when
/// `this_plan.should_display(false)` holds (presumably meaning the plan is
/// also shown in non-verbose output — confirm against `StringifiedPlan`).
/// Otherwise the caller may substitute a "same as above" marker.
fn should_show(previous_plan: &StringifiedPlan, this_plan: &StringifiedPlan) -> bool {
    let text_changed = previous_plan.plan != this_plan.plan;
    // `||` keeps the original short-circuit: `should_display` is only
    // consulted when the text is unchanged.
    text_changed || this_plan.should_display(false)
}