// polars_python/lazygroupby.rs
use std::sync::Arc;
use polars::lazy::frame::{LazyFrame, LazyGroupBy};
use polars::prelude::{DataFrame, PolarsError, Schema};
use pyo3::prelude::*;
use crate::conversion::Wrap;
use crate::error::PyPolarsErr;
use crate::expr::ToExprs;
use crate::py_modules::polars;
use crate::{PyDataFrame, PyExpr, PyLazyFrame};
// Python-exposed wrapper (`#[pyclass]`) around a Polars `LazyGroupBy`.
//
// The inner value is stored as an `Option`; every method in this file clones
// it and unwraps the clone, so a `None` here makes those methods panic.
// NOTE(review): presumably always constructed with `Some(..)` — confirm at the
// construction site, which is not visible in this file.
#[pyclass]
#[repr(transparent)]
pub struct PyLazyGroupBy {
// The wrapped lazy group-by; `None` is not handled by the methods below.
pub lgb: Option<LazyGroupBy>,
}
#[pymethods]
impl PyLazyGroupBy {
    // Converts `aggs` with `to_exprs` and forwards them to `LazyGroupBy::agg`,
    // returning the result as a `PyLazyFrame`.
    //
    // Panics if `self.lgb` is `None`.
    fn agg(&mut self, aggs: Vec<PyExpr>) -> PyLazyFrame {
        let lgb = self.lgb.clone().unwrap();
        let aggs = aggs.to_exprs();
        lgb.agg(aggs).into()
    }

    // Forwards to `LazyGroupBy::head` with `Some(n)`.
    //
    // Panics if `self.lgb` is `None`.
    fn head(&mut self, n: usize) -> PyLazyFrame {
        let lgb = self.lgb.clone().unwrap();
        lgb.head(Some(n)).into()
    }

    // Forwards to `LazyGroupBy::tail` with `Some(n)`.
    //
    // Panics if `self.lgb` is `None`.
    fn tail(&mut self, n: usize) -> PyLazyFrame {
        let lgb = self.lgb.clone().unwrap();
        lgb.tail(Some(n)).into()
    }

    // Applies a Python callable through `LazyGroupBy::apply`.
    //
    // * `lambda` - Python callable. It receives the object returned by the
    //   Python-side `wrap_df` helper for each `DataFrame` handed to the
    //   callback, and must return an object whose `_df` attribute can be
    //   extracted as a `PyDataFrame`.
    // * `schema` - Output schema. When `None`, the schema is collected from the
    //   group-by's own logical plan.
    //
    // Errors: returns a `PyErr` if the schema has to be collected and that
    // collection fails. Every failure inside the per-group callback (wrapping
    // the frame, calling `lambda`, reading `_df`, extracting the frame) is
    // reported as `PolarsError::ComputeError` instead of panicking.
    //
    // Panics if `self.lgb` is `None`.
    #[pyo3(signature = (lambda, schema=None))]
    fn map_groups(
        &mut self,
        lambda: PyObject,
        schema: Option<Wrap<Schema>>,
    ) -> PyResult<PyLazyFrame> {
        let lgb = self.lgb.clone().unwrap();
        let schema = match schema {
            Some(schema) => Arc::new(schema.0),
            None => LazyFrame::from(lgb.logical_plan.clone())
                .collect_schema()
                .map_err(PyPolarsErr::from)?,
        };

        let function = move |df: DataFrame| {
            Python::with_gil(|py| {
                // Single place where Python-side failures become Polars errors.
                let compute_err = |msg: String| PolarsError::ComputeError(msg.into());

                let pypolars = polars(py).bind(py);
                let pydf = PyDataFrame::new(df);

                // Build the Python-side wrapper object that is handed to the user function.
                let python_df_wrapper = pypolars
                    .getattr("wrap_df")
                    .and_then(|wrap_df| wrap_df.call1((pydf,)))
                    .map_err(|e| {
                        compute_err(format!(
                            "Could not wrap DataFrame for the python function: {e}"
                        ))
                    })?;

                let result_df_wrapper = lambda
                    .call1(py, (python_df_wrapper,))
                    .map_err(|e| {
                        compute_err(format!("User provided python function failed: {e}"))
                    })?;

                // The user function may return anything; a missing `_df` is a user
                // error and must surface as an error rather than a panic.
                let py_pydf = result_df_wrapper.getattr(py, "_df").map_err(|e| {
                    compute_err(format!(
                        "Could not get DataFrame attribute '_df'. Make sure that you return a DataFrame object. ({e})"
                    ))
                })?;

                let pydf = py_pydf.extract::<PyDataFrame>(py).map_err(|e| {
                    compute_err(format!(
                        "Could not extract a DataFrame from attribute '_df'. Make sure that you return a DataFrame object. ({e})"
                    ))
                })?;

                Ok(pydf.df)
            })
        };

        Ok(lgb.apply(function, schema).into())
    }
}