use fmt::Debug;
use std::any::Any;
use std::fmt;
use arrow::{
datatypes::Field,
datatypes::{DataType, Schema},
};
use super::{
expressions::format_state_name, type_coercion::coerce, Accumulator, AggregateExpr,
};
use crate::error::Result;
use crate::physical_plan::PhysicalExpr;
pub use datafusion_expr::AggregateUDF;
use std::sync::Arc;
/// Creates a physical aggregate expression for the user-defined aggregate `fun`.
///
/// The input expressions are first coerced against `fun.signature`. The output
/// data type is then obtained by calling `fun.return_type` with the data types
/// of the coerced expressions, resolved against `input_schema`. `name` becomes
/// the name of the resulting expression.
///
/// # Errors
///
/// Propagates any error returned while coercing the inputs, while resolving the
/// data type of a coerced expression, or by `fun.return_type`.
pub fn create_aggregate_expr(
    fun: &AggregateUDF,
    input_phy_exprs: &[Arc<dyn PhysicalExpr>],
    input_schema: &Schema,
    name: impl Into<String>,
) -> Result<Arc<dyn AggregateExpr>> {
    let coerced_phy_exprs = coerce(input_phy_exprs, input_schema, &fun.signature)?;

    let coerced_exprs_types = coerced_phy_exprs
        .iter()
        .map(|arg| arg.data_type(input_schema))
        .collect::<Result<Vec<_>>>()?;

    // Resolve the return type up front so the fallible step happens before the
    // expression is assembled.
    let data_type = (fun.return_type)(&coerced_exprs_types)?.as_ref().clone();

    Ok(Arc::new(AggregateFunctionExpr {
        fun: fun.clone(),
        // The coerced expressions are not used past this point, so move them
        // into the struct instead of cloning the whole vector.
        args: coerced_phy_exprs,
        data_type,
        name: name.into(),
    }))
}
/// Physical aggregate expression backed by an [`AggregateUDF`].
///
/// Instances are built by [`create_aggregate_expr`].
#[derive(Debug)]
pub struct AggregateFunctionExpr {
/// The aggregate UDF; its `state_type` and `accumulator` callbacks are used by the `AggregateExpr` impl.
fun: AggregateUDF,
/// Argument expressions, after coercion against the UDF's signature.
args: Vec<Arc<dyn PhysicalExpr>>,
/// Output data type, computed by the UDF's `return_type` from the coerced argument types.
data_type: DataType,
/// Name of the output field; also the base for the state field names.
name: String,
}
impl AggregateExpr for AggregateFunctionExpr {
    /// Returns `self` as a `&dyn Any`.
    fn as_any(&self) -> &dyn Any {
        self
    }

    /// Returns a fresh vector holding clones of the argument expressions.
    fn expressions(&self) -> Vec<Arc<dyn PhysicalExpr>> {
        self.args.iter().cloned().collect()
    }

    /// Builds one field per state data type reported by the UDF's `state_type`
    /// callback for this expression's output type.
    ///
    /// Each field is named by `format_state_name` from this expression's name and
    /// the zero-based position of the state type, and is created with the
    /// nullable flag set to `true`.
    fn state_fields(&self) -> Result<Vec<Field>> {
        let state_types = (self.fun.state_type)(&self.data_type)?;

        let mut state_fields = Vec::with_capacity(state_types.len());
        for (position, state_type) in state_types.iter().enumerate() {
            let state_name = format_state_name(&self.name, &position.to_string());
            state_fields.push(Field::new(&state_name, state_type.clone(), true));
        }

        Ok(state_fields)
    }

    /// Returns the output field: this expression's name and data type, with the
    /// nullable flag set to `true`.
    fn field(&self) -> Result<Field> {
        let output_type = self.data_type.clone();
        let output_field = Field::new(&self.name, output_type, true);
        Ok(output_field)
    }

    /// Invokes the UDF's `accumulator` callback and returns its result.
    fn create_accumulator(&self) -> Result<Box<dyn Accumulator>> {
        (self.fun.accumulator)()
    }

    /// Returns the name given to this expression.
    fn name(&self) -> &str {
        self.name.as_str()
    }
}