1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
//! Defines physical expressions for APPROX_MEDIAN that can be evaluated at runtime during query execution
use crate::aggregate::utils::down_cast_any_ref;
use crate::expressions::{lit, ApproxPercentileCont};
use crate::{AggregateExpr, PhysicalExpr};
use arrow::{datatypes::DataType, datatypes::Field};
use datafusion_common::Result;
use datafusion_expr::Accumulator;
use std::any::Any;
use std::sync::Arc;
/// APPROX_MEDIAN aggregate expression
///
/// Wraps an [`ApproxPercentileCont`] that is constructed with the literal
/// percentile `0.5`; accumulator creation and state fields are delegated to it.
#[derive(Debug)]
pub struct ApproxMedian {
/// Name of this aggregate; also used as the name of the output field.
name: String,
/// Input expression the aggregate is computed over.
expr: Arc<dyn PhysicalExpr>,
/// Data type reported for the output field.
data_type: DataType,
/// Inner percentile aggregate built from `expr` and the literal `0.5`.
approx_percentile: ApproxPercentileCont,
}
impl ApproxMedian {
    /// Build an APPROX_MEDIAN aggregate over `expr`.
    ///
    /// `name` becomes the name of the aggregate and `data_type` the type of
    /// its output field. Internally an [`ApproxPercentileCont`] is created
    /// with the arguments `[expr, 0.5]`, sharing the same name and data type.
    ///
    /// # Errors
    ///
    /// Propagates any error returned by `ApproxPercentileCont::new`.
    pub fn try_new(
        expr: Arc<dyn PhysicalExpr>,
        name: impl Into<String>,
        data_type: DataType,
    ) -> Result<Self> {
        let name: String = name.into();

        // The inner aggregate receives the input expression followed by the
        // fixed percentile literal 0.5.
        let percentile_args = vec![Arc::clone(&expr), lit(0.5_f64)];
        let approx_percentile =
            ApproxPercentileCont::new(percentile_args, name.clone(), data_type.clone())?;

        Ok(Self {
            name,
            expr,
            data_type,
            approx_percentile,
        })
    }
}
impl AggregateExpr for ApproxMedian {
    /// Expose `self` as `&dyn Any` so callers can downcast to the concrete type.
    fn as_any(&self) -> &dyn Any {
        self
    }

    /// Output field: named after this aggregate, typed as `data_type`,
    /// and always declared nullable.
    fn field(&self) -> Result<Field> {
        let nullable = true;
        let output = Field::new(&self.name, self.data_type.clone(), nullable);
        Ok(output)
    }

    /// Accumulator creation is delegated to the inner percentile aggregate.
    fn create_accumulator(&self) -> Result<Box<dyn Accumulator>> {
        let inner = &self.approx_percentile;
        inner.create_accumulator()
    }

    /// State fields are those of the inner percentile aggregate.
    fn state_fields(&self) -> Result<Vec<Field>> {
        let inner = &self.approx_percentile;
        inner.state_fields()
    }

    /// Only the input expression is reported; the `0.5` literal passed to
    /// the inner aggregate is not included.
    fn expressions(&self) -> Vec<Arc<dyn PhysicalExpr>> {
        let input = Arc::clone(&self.expr);
        vec![input]
    }

    /// Name given to this aggregate at construction.
    fn name(&self) -> &str {
        self.name.as_str()
    }
}
impl PartialEq<dyn Any> for ApproxMedian {
fn eq(&self, other: &dyn Any) -> bool {
down_cast_any_ref(other)
.downcast_ref::<Self>()
.map(|x| {
self.name == x.name
&& self.data_type == x.data_type
&& self.expr.eq(&x.expr)
&& self.approx_percentile == x.approx_percentile
})
.unwrap_or(false)
}
}