use fmt::{Debug, Formatter};
use std::{cell::RefCell, fmt, rc::Rc};
use arrow::{
datatypes::Field,
datatypes::{DataType, Schema},
};
use crate::physical_plan::PhysicalExpr;
use crate::{error::Result, logical_plan::Expr};
use super::{
aggregates::AccumulatorFunctionImplementation,
aggregates::StateTypeFunction,
expressions::format_state_name,
functions::{ReturnTypeFunction, Signature},
type_coercion::coerce,
Accumulator, AggregateExpr,
};
use std::sync::Arc;
/// Description of a user-defined aggregate function (UDAF): its name, the
/// signature its arguments are coerced against, and the callbacks used to
/// derive its types and to build its accumulator.
#[derive(Clone)]
pub struct AggregateUDF {
/// Name of the function.
pub name: String,
/// Signature passed to `coerce` when a physical expression is created for
/// this function.
pub signature: Signature,
/// Callback invoked with the (coerced) argument types; yields the data type
/// of the aggregate's result.
pub return_type: ReturnTypeFunction,
/// Callback invoked with no arguments to create a fresh accumulator.
pub accumulator: AccumulatorFunctionImplementation,
/// Callback invoked with the aggregate's result data type; yields the data
/// types of the accumulator's state fields.
pub state_type: StateTypeFunction,
}
impl Debug for AggregateUDF {
    /// Formats the UDAF as a debug struct showing its `name` and `signature`.
    ///
    /// The function callbacks are not printed; a single `fun` entry with the
    /// fixed placeholder `"<FUNC>"` is emitted instead.
    fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
        let mut builder = f.debug_struct("AggregateUDF");
        builder.field("name", &self.name);
        builder.field("signature", &self.signature);
        // Placeholder standing in for the callbacks held by this struct.
        builder.field("fun", &"<FUNC>");
        builder.finish()
    }
}
impl AggregateUDF {
    /// Builds a new `AggregateUDF` from borrowed parts.
    ///
    /// Every argument is copied into the new value: `name` is converted to an
    /// owned `String` and the remaining arguments are cloned, so the caller
    /// keeps ownership of everything it passed in.
    pub fn new(
        name: &str,
        signature: &Signature,
        return_type: &ReturnTypeFunction,
        accumulator: &AccumulatorFunctionImplementation,
        state_type: &StateTypeFunction,
    ) -> Self {
        let name = String::from(name);
        let signature = signature.clone();
        let return_type = return_type.clone();
        let accumulator = accumulator.clone();
        let state_type = state_type.clone();

        Self {
            name,
            signature,
            return_type,
            accumulator,
            state_type,
        }
    }

    /// Creates an `Expr::AggregateUDF` that applies this function to `args`.
    ///
    /// The expression holds its own copy of this UDAF (a clone wrapped in an
    /// `Arc`).
    pub fn call(&self, args: Vec<Expr>) -> Expr {
        let fun = Arc::new(self.clone());
        Expr::AggregateUDF { fun, args }
    }
}
/// Creates a physical aggregate expression for the user-defined aggregate
/// function `fun`.
///
/// The arguments are first coerced against `fun.signature` (via `coerce`),
/// their data types are resolved against `input_schema`, and those types are
/// handed to `fun.return_type` to determine the data type of the result.
///
/// `name` becomes the name of the resulting expression.
///
/// # Errors
///
/// Propagates any error returned by `coerce`, by an argument's `data_type`
/// lookup, or by the `fun.return_type` callback.
pub fn create_aggregate_expr(
    fun: &AggregateUDF,
    // NOTE(review): kept as `&Vec<_>` rather than a slice because it is
    // forwarded to `coerce`, whose parameter type is not visible from here.
    args: &Vec<Arc<dyn PhysicalExpr>>,
    input_schema: &Schema,
    name: String,
) -> Result<Arc<dyn AggregateExpr>> {
    // Shadow the borrowed arguments with the owned, coerced ones.
    let args = coerce(args, input_schema, &fun.signature)?;

    let arg_types = args
        .iter()
        .map(|arg| arg.data_type(input_schema))
        .collect::<Result<Vec<_>>>()?;

    let data_type = (fun.return_type)(&arg_types)?.as_ref().clone();

    // `args` and `name` are owned and not used afterwards, so they are moved
    // into the expression instead of being cloned.
    Ok(Arc::new(AggregateFunctionExpr {
        fun: fun.clone(),
        args,
        data_type,
        name,
    }))
}
/// Physical aggregate expression for a user-defined aggregate function, as
/// built by `create_aggregate_expr`.
#[derive(Debug)]
pub struct AggregateFunctionExpr {
/// The user-defined aggregate function this expression evaluates.
fun: AggregateUDF,
/// Argument expressions (already coerced when built by
/// `create_aggregate_expr`).
args: Vec<Arc<dyn PhysicalExpr>>,
/// Data type of the aggregate's result.
data_type: DataType,
/// Name of the output field; also passed to `format_state_name` to name the
/// state fields.
name: String,
}
impl AggregateExpr for AggregateFunctionExpr {
    /// Returns the argument expressions of this aggregate.
    fn expressions(&self) -> Vec<Arc<dyn PhysicalExpr>> {
        self.args.iter().cloned().collect()
    }

    /// Returns one nullable field per state data type reported by the UDAF's
    /// `state_type` callback.
    ///
    /// Each field is named by `format_state_name` from this expression's name
    /// and the zero-based position of the state.
    fn state_fields(&self) -> Result<Vec<Field>> {
        let state_types = (self.fun.state_type)(&self.data_type)?;

        let mut fields = Vec::new();
        for (index, state_type) in state_types.iter().enumerate() {
            let field_name = format_state_name(&self.name, &index.to_string());
            fields.push(Field::new(&field_name, state_type.clone(), true));
        }
        Ok(fields)
    }

    /// Returns the nullable output field of this aggregate, carrying the
    /// expression's name and result data type.
    fn field(&self) -> Result<Field> {
        let output = Field::new(&self.name, self.data_type.clone(), true);
        Ok(output)
    }

    /// Creates a new accumulator by invoking the UDAF's `accumulator`
    /// callback.
    fn create_accumulator(&self) -> Result<Rc<RefCell<dyn Accumulator>>> {
        (self.fun.accumulator)()
    }
}