// datafusion_physical_expr/expressions/not.rs
use std::any::Any;
use std::fmt;
use std::hash::{Hash, Hasher};
use std::sync::Arc;
use crate::physical_expr::down_cast_any_ref;
use crate::PhysicalExpr;
use arrow::datatypes::{DataType, Schema};
use arrow::record_batch::RecordBatch;
use datafusion_common::{cast::as_boolean_array, Result, ScalarValue};
use datafusion_expr::interval_arithmetic::Interval;
use datafusion_expr::ColumnarValue;
/// Physical expression that applies logical `NOT` to the result of a child expression.
///
/// Evaluation expects the child to produce boolean values and always reports
/// `DataType::Boolean` as its own output type.
#[derive(Debug, Hash)]
pub struct NotExpr {
/// The operand expression whose result is negated.
arg: Arc<dyn PhysicalExpr>,
}
impl NotExpr {
pub fn new(arg: Arc<dyn PhysicalExpr>) -> Self {
Self { arg }
}
pub fn arg(&self) -> &Arc<dyn PhysicalExpr> {
&self.arg
}
}
impl fmt::Display for NotExpr {
    /// Renders the expression as `NOT <operand>`, using the operand's own
    /// `Display` output.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        let operand = &self.arg;
        write!(f, "NOT {}", operand)
    }
}
impl PhysicalExpr for NotExpr {
    /// Exposes `self` as `&dyn Any` so callers can downcast to `NotExpr`.
    fn as_any(&self) -> &dyn Any {
        self
    }

    /// The result type is always `DataType::Boolean`; the schema is not consulted.
    fn data_type(&self, _input_schema: &Schema) -> Result<DataType> {
        Ok(DataType::Boolean)
    }

    /// Nullability is delegated to the operand expression.
    fn nullable(&self, input_schema: &Schema) -> Result<bool> {
        let operand = &self.arg;
        operand.nullable(input_schema)
    }

    /// Evaluates the operand against `batch` and negates the result.
    ///
    /// * Array results are downcast to a boolean array and passed through
    ///   arrow's boolean `not` kernel.
    /// * Scalar results are converted to `bool` and negated; a null scalar
    ///   yields `ScalarValue::Boolean(None)`.
    ///
    /// Errors from evaluating the operand, from the boolean downcast, from the
    /// kernel, or from the scalar-to-`bool` conversion are propagated.
    fn evaluate(&self, batch: &RecordBatch) -> Result<ColumnarValue> {
        match self.arg.evaluate(batch)? {
            ColumnarValue::Array(values) => {
                let booleans = as_boolean_array(&values)?;
                let negated = arrow::compute::kernels::boolean::not(booleans)?;
                Ok(ColumnarValue::Array(Arc::new(negated)))
            }
            ColumnarValue::Scalar(value) => {
                // A null operand stays null; otherwise flip the boolean.
                let negated = if value.is_null() {
                    None
                } else {
                    let truth: bool = value.try_into()?;
                    Some(!truth)
                };
                Ok(ColumnarValue::Scalar(ScalarValue::Boolean(negated)))
            }
        }
    }

    /// The only child is the operand expression.
    fn children(&self) -> Vec<&Arc<dyn PhysicalExpr>> {
        let operand = &self.arg;
        vec![operand]
    }

    /// Creates a new `NotExpr` over the first entry of `children`.
    ///
    /// Indexes `children[0]` directly, so an empty vector panics.
    fn with_new_children(
        self: Arc<Self>,
        children: Vec<Arc<dyn PhysicalExpr>>,
    ) -> Result<Arc<dyn PhysicalExpr>> {
        let operand = Arc::clone(&children[0]);
        Ok(Arc::new(NotExpr::new(operand)))
    }

    /// Computes the output bounds by applying `Interval::not` to the first
    /// child interval.
    ///
    /// Indexes `children[0]` directly, so an empty slice panics.
    fn evaluate_bounds(&self, children: &[&Interval]) -> Result<Interval> {
        let operand_bounds = children[0];
        operand_bounds.not()
    }

    /// Feeds this expression's derived `Hash` implementation into `state`.
    fn dyn_hash(&self, state: &mut dyn Hasher) {
        // `Hash::hash` needs a sized hasher type; `&mut dyn Hasher` itself
        // implements `Hasher`, so rebind it and pass a reference to that.
        let mut hasher = state;
        self.hash(&mut hasher);
    }
}
impl PartialEq<dyn Any> for NotExpr {
    /// Two values are equal when `other` downcasts to a `NotExpr` whose
    /// operand equals this one's; any other type compares unequal.
    fn eq(&self, other: &dyn Any) -> bool {
        match down_cast_any_ref(other).downcast_ref::<Self>() {
            Some(that) => self.arg.eq(&that.arg),
            None => false,
        }
    }
}
/// Wraps `arg` in a [`NotExpr`] and returns it as a shared `PhysicalExpr`.
///
/// As written this function always returns `Ok`.
pub fn not(arg: Arc<dyn PhysicalExpr>) -> Result<Arc<dyn PhysicalExpr>> {
    let negation = NotExpr::new(arg);
    Ok(Arc::new(negation))
}
#[cfg(test)]
mod tests {
    use super::*;
    use crate::expressions::col;
    use arrow::{array::BooleanArray, datatypes::*};
    use std::sync::OnceLock;

    /// Lazily-initialised schema shared by all tests in this module.
    static SCHEMA: OnceLock<SchemaRef> = OnceLock::new();

    /// Returns the shared schema: a single nullable boolean column named `a`.
    fn schema() -> SchemaRef {
        let shared = SCHEMA.get_or_init(|| {
            let fields = vec![Field::new("a", DataType::Boolean, true)];
            Arc::new(Schema::new(fields))
        });
        Arc::clone(shared)
    }

    /// Negating a boolean column flips non-null values and keeps nulls.
    #[test]
    fn neg_op() -> Result<()> {
        let test_schema = schema();
        let expr = not(col("a", &test_schema)?)?;

        assert_eq!(expr.data_type(&test_schema)?, DataType::Boolean);
        assert!(expr.nullable(&test_schema)?);

        let input = BooleanArray::from(vec![Some(true), None, Some(false)]);
        let expected = &BooleanArray::from(vec![Some(false), None, Some(true)]);
        let batch = RecordBatch::try_new(test_schema, vec![Arc::new(input)])?;

        let evaluated = expr.evaluate(&batch)?;
        let output = evaluated
            .into_array(batch.num_rows())
            .expect("Failed to convert to array");
        let result =
            as_boolean_array(&output).expect("failed to downcast to BooleanArray");

        assert_eq!(result, expected);
        Ok(())
    }

    /// Checks the bounds produced for each possible boolean input interval.
    #[test]
    fn test_evaluate_bounds() -> Result<()> {
        // ((input lower, input upper), (expected lower, expected upper))
        let cases = [
            ((false, true), (false, true)),
            ((true, true), (false, false)),
            ((false, false), (true, true)),
        ];
        for ((in_lower, in_upper), (out_lower, out_upper)) in cases {
            assert_evaluate_bounds(
                Interval::make(Some(in_lower), Some(in_upper))?,
                Interval::make(Some(out_lower), Some(out_upper))?,
            )?;
        }
        Ok(())
    }

    /// Asserts that `NOT a` maps `interval` to `expected_interval`.
    fn assert_evaluate_bounds(
        interval: Interval,
        expected_interval: Interval,
    ) -> Result<()> {
        let not_expr = not(col("a", &schema())?)?;
        let actual = not_expr.evaluate_bounds(&[&interval]).unwrap();
        assert_eq!(actual, expected_interval);
        Ok(())
    }
}