polars_plan/dsl/functions/
horizontal.rsuse super::*;
#[cfg(feature = "dtype-struct")]
fn cum_fold_dtype() -> GetOutput {
GetOutput::map_fields(|fields| {
let mut st = fields[0].dtype.clone();
for fld in &fields[1..] {
st = get_supertype(&st, &fld.dtype).unwrap();
}
Ok(Field::new(
fields[0].name.clone(),
DataType::Struct(
fields
.iter()
.map(|fld| Field::new(fld.name().clone(), st.clone()))
.collect(),
),
))
})
}
pub fn fold_exprs<F, E>(acc: Expr, f: F, exprs: E) -> Expr
where
F: 'static + Fn(Column, Column) -> PolarsResult<Option<Column>> + Send + Sync,
E: AsRef<[Expr]>,
{
let mut exprs = exprs.as_ref().to_vec();
exprs.push(acc);
let function = new_column_udf(move |columns: &mut [Column]| {
let mut columns = columns.to_vec();
let mut acc = columns.pop().unwrap();
for c in columns {
if let Some(a) = f(acc.clone(), c)? {
acc = a
}
}
Ok(Some(acc))
});
Expr::AnonymousFunction {
input: exprs,
function,
output_type: GetOutput::super_type(),
options: FunctionOptions {
collect_groups: ApplyOptions::GroupWise,
flags: FunctionFlags::default()
| FunctionFlags::INPUT_WILDCARD_EXPANSION
| FunctionFlags::RETURNS_SCALAR,
fmt_str: "fold",
..Default::default()
},
}
}
pub fn reduce_exprs<F, E>(f: F, exprs: E) -> Expr
where
F: 'static + Fn(Column, Column) -> PolarsResult<Option<Column>> + Send + Sync,
E: AsRef<[Expr]>,
{
let exprs = exprs.as_ref().to_vec();
let function = new_column_udf(move |columns: &mut [Column]| {
let mut c_iter = columns.iter();
match c_iter.next() {
Some(acc) => {
let mut acc = acc.clone();
for c in c_iter {
if let Some(a) = f(acc.clone(), c.clone())? {
acc = a
}
}
Ok(Some(acc))
},
None => Err(polars_err!(ComputeError: "`reduce` did not have any expressions to fold")),
}
});
Expr::AnonymousFunction {
input: exprs,
function,
output_type: GetOutput::super_type(),
options: FunctionOptions {
collect_groups: ApplyOptions::GroupWise,
flags: FunctionFlags::default()
| FunctionFlags::INPUT_WILDCARD_EXPANSION
| FunctionFlags::RETURNS_SCALAR,
fmt_str: "reduce",
..Default::default()
},
}
}
#[cfg(feature = "dtype-struct")]
pub fn cum_reduce_exprs<F, E>(f: F, exprs: E) -> Expr
where
F: 'static + Fn(Column, Column) -> PolarsResult<Option<Column>> + Send + Sync,
E: AsRef<[Expr]>,
{
let exprs = exprs.as_ref().to_vec();
let function = new_column_udf(move |columns: &mut [Column]| {
let mut c_iter = columns.iter();
match c_iter.next() {
Some(acc) => {
let mut acc = acc.clone();
let mut result = vec![acc.clone()];
for c in c_iter {
let name = c.name().clone();
if let Some(a) = f(acc.clone(), c.clone())? {
acc = a;
}
acc.rename(name);
result.push(acc.clone());
}
StructChunked::from_columns(acc.name().clone(), result[0].len(), &result)
.map(|ca| Some(ca.into_column()))
},
None => Err(polars_err!(ComputeError: "`reduce` did not have any expressions to fold")),
}
});
Expr::AnonymousFunction {
input: exprs,
function,
output_type: cum_fold_dtype(),
options: FunctionOptions {
collect_groups: ApplyOptions::GroupWise,
flags: FunctionFlags::default()
| FunctionFlags::INPUT_WILDCARD_EXPANSION
| FunctionFlags::RETURNS_SCALAR,
fmt_str: "cum_reduce",
..Default::default()
},
}
}
#[cfg(feature = "dtype-struct")]
pub fn cum_fold_exprs<F, E>(acc: Expr, f: F, exprs: E, include_init: bool) -> Expr
where
F: 'static + Fn(Column, Column) -> PolarsResult<Option<Column>> + Send + Sync,
E: AsRef<[Expr]>,
{
let mut exprs = exprs.as_ref().to_vec();
exprs.push(acc);
let function = new_column_udf(move |columns: &mut [Column]| {
let mut columns = columns.to_vec();
let mut acc = columns.pop().unwrap();
let mut result = vec![];
if include_init {
result.push(acc.clone())
}
for c in columns {
let name = c.name().clone();
if let Some(a) = f(acc.clone(), c)? {
acc = a;
acc.rename(name);
result.push(acc.clone());
}
}
StructChunked::from_columns(acc.name().clone(), result[0].len(), &result)
.map(|ca| Some(ca.into_column()))
});
Expr::AnonymousFunction {
input: exprs,
function,
output_type: cum_fold_dtype(),
options: FunctionOptions {
collect_groups: ApplyOptions::GroupWise,
flags: FunctionFlags::default()
| FunctionFlags::INPUT_WILDCARD_EXPANSION
| FunctionFlags::RETURNS_SCALAR,
fmt_str: "cum_fold",
..Default::default()
},
}
}
pub fn all_horizontal<E: AsRef<[Expr]>>(exprs: E) -> PolarsResult<Expr> {
let exprs = exprs.as_ref().to_vec();
polars_ensure!(!exprs.is_empty(), ComputeError: "cannot return empty fold because the number of output rows is unknown");
Ok(Expr::Function {
input: exprs,
function: FunctionExpr::Boolean(BooleanFunction::AllHorizontal),
options: FunctionOptions {
flags: FunctionFlags::default()
| FunctionFlags::INPUT_WILDCARD_EXPANSION
| FunctionFlags::ALLOW_EMPTY_INPUTS,
..Default::default()
},
})
}
pub fn any_horizontal<E: AsRef<[Expr]>>(exprs: E) -> PolarsResult<Expr> {
let exprs = exprs.as_ref().to_vec();
polars_ensure!(!exprs.is_empty(), ComputeError: "cannot return empty fold because the number of output rows is unknown");
Ok(Expr::Function {
input: exprs,
function: FunctionExpr::Boolean(BooleanFunction::AnyHorizontal),
options: FunctionOptions {
flags: FunctionFlags::default()
| FunctionFlags::INPUT_WILDCARD_EXPANSION
| FunctionFlags::ALLOW_EMPTY_INPUTS,
..Default::default()
},
})
}
pub fn max_horizontal<E: AsRef<[Expr]>>(exprs: E) -> PolarsResult<Expr> {
let exprs = exprs.as_ref().to_vec();
polars_ensure!(!exprs.is_empty(), ComputeError: "cannot return empty fold because the number of output rows is unknown");
Ok(Expr::Function {
input: exprs,
function: FunctionExpr::MaxHorizontal,
options: FunctionOptions {
collect_groups: ApplyOptions::ElementWise,
flags: FunctionFlags::default()
| FunctionFlags::INPUT_WILDCARD_EXPANSION & !FunctionFlags::RETURNS_SCALAR
| FunctionFlags::ALLOW_RENAME,
..Default::default()
},
})
}
pub fn min_horizontal<E: AsRef<[Expr]>>(exprs: E) -> PolarsResult<Expr> {
let exprs = exprs.as_ref().to_vec();
polars_ensure!(!exprs.is_empty(), ComputeError: "cannot return empty fold because the number of output rows is unknown");
Ok(Expr::Function {
input: exprs,
function: FunctionExpr::MinHorizontal,
options: FunctionOptions {
collect_groups: ApplyOptions::ElementWise,
flags: FunctionFlags::default()
| FunctionFlags::INPUT_WILDCARD_EXPANSION & !FunctionFlags::RETURNS_SCALAR
| FunctionFlags::ALLOW_RENAME,
..Default::default()
},
})
}
pub fn sum_horizontal<E: AsRef<[Expr]>>(exprs: E) -> PolarsResult<Expr> {
let exprs = exprs.as_ref().to_vec();
polars_ensure!(!exprs.is_empty(), ComputeError: "cannot return empty fold because the number of output rows is unknown");
Ok(Expr::Function {
input: exprs,
function: FunctionExpr::SumHorizontal,
options: FunctionOptions {
collect_groups: ApplyOptions::ElementWise,
flags: FunctionFlags::default()
| FunctionFlags::INPUT_WILDCARD_EXPANSION & !FunctionFlags::RETURNS_SCALAR,
cast_to_supertypes: None,
..Default::default()
},
})
}
pub fn mean_horizontal<E: AsRef<[Expr]>>(exprs: E) -> PolarsResult<Expr> {
let exprs = exprs.as_ref().to_vec();
polars_ensure!(!exprs.is_empty(), ComputeError: "cannot return empty fold because the number of output rows is unknown");
Ok(Expr::Function {
input: exprs,
function: FunctionExpr::MeanHorizontal,
options: FunctionOptions {
collect_groups: ApplyOptions::ElementWise,
flags: FunctionFlags::default()
| FunctionFlags::INPUT_WILDCARD_EXPANSION & !FunctionFlags::RETURNS_SCALAR,
cast_to_supertypes: None,
..Default::default()
},
})
}
pub fn coalesce(exprs: &[Expr]) -> Expr {
let input = exprs.to_vec();
Expr::Function {
input,
function: FunctionExpr::Coalesce,
options: FunctionOptions {
collect_groups: ApplyOptions::ElementWise,
cast_to_supertypes: Some(Default::default()),
flags: FunctionFlags::default() | FunctionFlags::INPUT_WILDCARD_EXPANSION,
..Default::default()
},
}
}