Skip to content

Commit ee3cfdc

Browse files
committed
Handle one-element array return value in ScalarFunctionExpr
This was done in #12922 only for math functions. We now generalize this fallback to all scalar UDFs.
1 parent 747001a commit ee3cfdc

File tree

3 files changed

+21
-20
lines changed

3 files changed

+21
-20
lines changed

datafusion/expr-common/src/columnar_value.rs

Lines changed: 0 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -217,17 +217,6 @@ impl ColumnarValue {
217217
}
218218
}
219219
}
220-
221-
/// Converts an [`ArrayRef`] to a [`ColumnarValue`] based on the supplied arguments.
222-
/// This is useful for scalar UDF implementations to fulfil their contract:
223-
/// if all arguments are scalar values, the result should also be a scalar value.
224-
pub fn from_args_and_result(args: &[Self], result: ArrayRef) -> Result<Self> {
225-
if result.len() == 1 && args.iter().all(|arg| matches!(arg, Self::Scalar(_))) {
226-
Ok(Self::Scalar(ScalarValue::try_from_array(&result, 0)?))
227-
} else {
228-
Ok(Self::Array(result))
229-
}
230-
}
231220
}
232221

233222
#[cfg(test)]

datafusion/functions/src/macros.rs

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -228,8 +228,8 @@ macro_rules! make_math_unary_udf {
228228
$EVALUATE_BOUNDS(inputs)
229229
}
230230

231-
fn invoke(&self, col_args: &[ColumnarValue]) -> Result<ColumnarValue> {
232-
let args = ColumnarValue::values_to_arrays(col_args)?;
231+
fn invoke(&self, args: &[ColumnarValue]) -> Result<ColumnarValue> {
232+
let args = ColumnarValue::values_to_arrays(args)?;
233233
let arr: ArrayRef = match args[0].data_type() {
234234
DataType::Float64 => {
235235
Arc::new(make_function_scalar_inputs_return_type!(
@@ -257,7 +257,7 @@ macro_rules! make_math_unary_udf {
257257
}
258258
};
259259

260-
ColumnarValue::from_args_and_result(col_args, arr)
260+
Ok(ColumnarValue::Array(arr))
261261
}
262262

263263
fn documentation(&self) -> Option<&Documentation> {
@@ -344,8 +344,8 @@ macro_rules! make_math_binary_udf {
344344
$OUTPUT_ORDERING(input)
345345
}
346346

347-
fn invoke(&self, col_args: &[ColumnarValue]) -> Result<ColumnarValue> {
348-
let args = ColumnarValue::values_to_arrays(col_args)?;
347+
fn invoke(&self, args: &[ColumnarValue]) -> Result<ColumnarValue> {
348+
let args = ColumnarValue::values_to_arrays(args)?;
349349
let arr: ArrayRef = match args[0].data_type() {
350350
DataType::Float64 => Arc::new(make_function_inputs2!(
351351
&args[0],
@@ -372,7 +372,7 @@ macro_rules! make_math_binary_udf {
372372
}
373373
};
374374

375-
ColumnarValue::from_args_and_result(col_args, arr)
375+
Ok(ColumnarValue::Array(arr))
376376
}
377377

378378
fn documentation(&self) -> Option<&Documentation> {

datafusion/physical-expr/src/scalar_function.rs

Lines changed: 15 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -39,7 +39,8 @@ use crate::PhysicalExpr;
3939

4040
use arrow::datatypes::{DataType, Schema};
4141
use arrow::record_batch::RecordBatch;
42-
use datafusion_common::{internal_err, DFSchema, Result};
42+
use arrow_array::Array;
43+
use datafusion_common::{internal_err, DFSchema, Result, ScalarValue};
4344
use datafusion_expr::interval_arithmetic::Interval;
4445
use datafusion_expr::sort_properties::ExprProperties;
4546
use datafusion_expr::type_coercion::functions::data_types_with_scalar_udf;
@@ -147,8 +148,19 @@ impl PhysicalExpr for ScalarFunctionExpr {
147148

148149
if let ColumnarValue::Array(array) = &output {
149150
if array.len() != batch.num_rows() {
150-
return internal_err!("UDF returned a different number of rows than expected. Expected: {}, Got: {}",
151-
batch.num_rows(), array.len());
151+
// If the arguments are a non-empty slice of scalar values, we can assume that
152+
// returning a one-element array is equivalent to returning a scalar.
153+
let preserve_scalar = array.len() == 1
154+
&& !inputs.is_empty()
155+
&& inputs
156+
.iter()
157+
.all(|arg| matches!(arg, ColumnarValue::Scalar(_)));
158+
return if preserve_scalar {
159+
ScalarValue::try_from_array(array, 0).map(ColumnarValue::Scalar)
160+
} else {
161+
internal_err!("UDF returned a different number of rows than expected. Expected: {}, Got: {}",
162+
batch.num_rows(), array.len())
163+
};
152164
}
153165
}
154166
Ok(output)

0 commit comments

Comments
 (0)