From 41d286731230d11d1c452f4b97a40bca2ce9e044 Mon Sep 17 00:00:00 2001 From: Jay Zhan Date: Sun, 21 Apr 2024 11:15:39 +0800 Subject: [PATCH] Minor: Support more args for udaf (#10146) * support more args for udaf Signed-off-by: jayzhan211 * fmt Signed-off-by: jayzhan211 --------- Signed-off-by: jayzhan211 --- datafusion-cli/Cargo.lock | 1 + datafusion/functions-aggregate/Cargo.toml | 1 + .../functions-aggregate/src/first_last.rs | 2 +- datafusion/functions-aggregate/src/macros.rs | 21 ++++++++++++------- .../tests/cases/roundtrip_logical_plan.rs | 2 +- 5 files changed, 17 insertions(+), 10 deletions(-) diff --git a/datafusion-cli/Cargo.lock b/datafusion-cli/Cargo.lock index 5ce5beab4d709..9a27d7fff923b 100644 --- a/datafusion-cli/Cargo.lock +++ b/datafusion-cli/Cargo.lock @@ -1291,6 +1291,7 @@ dependencies = [ "datafusion-physical-expr-common", "log", "paste", + "sqlparser", ] [[package]] diff --git a/datafusion/functions-aggregate/Cargo.toml b/datafusion/functions-aggregate/Cargo.toml index be354acb48515..f976475653644 100644 --- a/datafusion/functions-aggregate/Cargo.toml +++ b/datafusion/functions-aggregate/Cargo.toml @@ -45,3 +45,4 @@ datafusion-expr = { workspace = true } datafusion-physical-expr-common = { workspace = true } log = { workspace = true } paste = "1.0.14" +sqlparser = { workspace = true } diff --git a/datafusion/functions-aggregate/src/first_last.rs b/datafusion/functions-aggregate/src/first_last.rs index d5367ad34163e..1a56b23cd26a0 100644 --- a/datafusion/functions-aggregate/src/first_last.rs +++ b/datafusion/functions-aggregate/src/first_last.rs @@ -36,6 +36,7 @@ use datafusion_physical_expr_common::expressions; use datafusion_physical_expr_common::physical_expr::PhysicalExpr; use datafusion_physical_expr_common::sort_expr::{LexOrdering, PhysicalSortExpr}; use datafusion_physical_expr_common::utils::reverse_order_bys; +use sqlparser::ast::NullTreatment; use std::any::Any; use std::fmt::Debug; use std::sync::Arc; @@ -43,7 +44,6 @@ use std::sync::Arc; make_udaf_function!( FirstValue, first_value, - value, "Returns the first value in a group of values.", first_value_udaf ); diff --git a/datafusion/functions-aggregate/src/macros.rs b/datafusion/functions-aggregate/src/macros.rs index d24c60f932701..04f9fecb8b195 100644 --- a/datafusion/functions-aggregate/src/macros.rs +++ b/datafusion/functions-aggregate/src/macros.rs @@ -16,19 +16,24 @@ // under the License. macro_rules! make_udaf_function { - ($UDAF:ty, $EXPR_FN:ident, $($arg:ident)*, $DOC:expr, $AGGREGATE_UDF_FN:ident) => { + ($UDAF:ty, $EXPR_FN:ident, $DOC:expr, $AGGREGATE_UDF_FN:ident) => { paste::paste! { // "fluent expr_fn" style function #[doc = $DOC] - pub fn $EXPR_FN($($arg: Expr),*) -> Expr { + pub fn $EXPR_FN( + args: Vec, + distinct: bool, + filter: Option>, + order_by: Option>, + null_treatment: Option + ) -> Expr { Expr::AggregateFunction(datafusion_expr::expr::AggregateFunction::new_udf( $AGGREGATE_UDF_FN(), - vec![$($arg),*], - // TODO: Support arguments for `expr` API - false, - None, - None, - None, + args, + distinct, + filter, + order_by, + null_treatment, )) } diff --git a/datafusion/proto/tests/cases/roundtrip_logical_plan.rs b/datafusion/proto/tests/cases/roundtrip_logical_plan.rs index eee15008fbbb8..f97559e03af20 100644 --- a/datafusion/proto/tests/cases/roundtrip_logical_plan.rs +++ b/datafusion/proto/tests/cases/roundtrip_logical_plan.rs @@ -613,7 +613,7 @@ async fn roundtrip_expr_api() -> Result<()> { lit(1), ), array_replace_all(make_array(vec![lit(1), lit(2), lit(3)]), lit(2), lit(4)), - first_value(lit(1)), + first_value(vec![lit(1)], false, None, None, None), ]; // ensure expressions created with the expr api can be round tripped