use std::sync::Arc;
use polars_error::{polars_bail, PolarsResult};
use super::StructArray;
use crate::array::{Array, MutableArray};
use crate::bitmap::MutableBitmap;
use crate::datatypes::ArrowDataType;
#[derive(Debug)]
pub struct MutableStructArray {
data_type: ArrowDataType,
values: Vec<Box<dyn MutableArray>>,
validity: Option<MutableBitmap>,
}
fn check(
data_type: &ArrowDataType,
values: &[Box<dyn MutableArray>],
validity: Option<usize>,
) -> PolarsResult<()> {
let fields = StructArray::try_get_fields(data_type)?;
if fields.is_empty() {
polars_bail!(ComputeError: "a StructArray must contain at least one field")
}
if fields.len() != values.len() {
polars_bail!(ComputeError: "a StructArray must have a number of fields in its DataType equal to the number of child values")
}
fields
.iter().map(|a| &a.data_type)
.zip(values.iter().map(|a| a.data_type()))
.enumerate()
.try_for_each(|(index, (data_type, child))| {
if data_type != child {
polars_bail!(ComputeError:
"The children DataTypes of a StructArray must equal the children data types.
However, the field {index} has data type {data_type:?} but the value has data type {child:?}"
)
} else {
Ok(())
}
})?;
let len = values[0].len();
values
.iter()
.map(|a| a.len())
.enumerate()
.try_for_each(|(index, a_len)| {
if a_len != len {
polars_bail!(ComputeError:
"The children must have an equal number of values.
However, the values at index {index} have a length of {a_len}, which is different from values at index 0, {len}."
)
} else {
Ok(())
}
})?;
if validity.map_or(false, |validity| validity != len) {
polars_bail!(ComputeError:
"the validity length of a StructArray must match its number of elements",
)
}
Ok(())
}
impl From<MutableStructArray> for StructArray {
fn from(other: MutableStructArray) -> Self {
let validity = if other.validity.as_ref().map(|x| x.unset_bits()).unwrap_or(0) > 0 {
other.validity.map(|x| x.into())
} else {
None
};
StructArray::new(
other.data_type,
other.values.into_iter().map(|mut v| v.as_box()).collect(),
validity,
)
}
}
impl MutableStructArray {
pub fn new(data_type: ArrowDataType, values: Vec<Box<dyn MutableArray>>) -> Self {
Self::try_new(data_type, values, None).unwrap()
}
pub fn try_new(
data_type: ArrowDataType,
values: Vec<Box<dyn MutableArray>>,
validity: Option<MutableBitmap>,
) -> PolarsResult<Self> {
check(&data_type, &values, validity.as_ref().map(|x| x.len()))?;
Ok(Self {
data_type,
values,
validity,
})
}
pub fn into_inner(
self,
) -> (
ArrowDataType,
Vec<Box<dyn MutableArray>>,
Option<MutableBitmap>,
) {
(self.data_type, self.values, self.validity)
}
pub fn mut_values(&mut self) -> &mut Vec<Box<dyn MutableArray>> {
&mut self.values
}
pub fn values(&self) -> &Vec<Box<dyn MutableArray>> {
&self.values
}
pub fn value<A: MutableArray + 'static>(&mut self, i: usize) -> Option<&mut A> {
self.values[i].as_mut_any().downcast_mut::<A>()
}
}
impl MutableStructArray {
pub fn reserve(&mut self, additional: usize) {
for v in &mut self.values {
v.reserve(additional);
}
if let Some(x) = self.validity.as_mut() {
x.reserve(additional)
}
}
pub fn push(&mut self, valid: bool) {
match &mut self.validity {
Some(validity) => validity.push(valid),
None => match valid {
true => (),
false => self.init_validity(),
},
};
}
fn push_null(&mut self) {
for v in &mut self.values {
v.push_null();
}
self.push(false);
}
fn init_validity(&mut self) {
let mut validity = MutableBitmap::with_capacity(self.values.capacity());
let len = self.len();
if len > 0 {
validity.extend_constant(len, true);
validity.set(len - 1, false);
}
self.validity = Some(validity)
}
pub fn into_arc(self) -> Arc<dyn Array> {
let a: StructArray = self.into();
Arc::new(a)
}
pub fn shrink_to_fit(&mut self) {
for v in &mut self.values {
v.shrink_to_fit();
}
if let Some(validity) = self.validity.as_mut() {
validity.shrink_to_fit()
}
}
}
impl MutableArray for MutableStructArray {
fn len(&self) -> usize {
self.values.first().map(|v| v.len()).unwrap_or(0)
}
fn validity(&self) -> Option<&MutableBitmap> {
self.validity.as_ref()
}
fn as_box(&mut self) -> Box<dyn Array> {
StructArray::new(
self.data_type.clone(),
std::mem::take(&mut self.values)
.into_iter()
.map(|mut v| v.as_box())
.collect(),
std::mem::take(&mut self.validity).map(|x| x.into()),
)
.boxed()
}
fn as_arc(&mut self) -> Arc<dyn Array> {
StructArray::new(
self.data_type.clone(),
std::mem::take(&mut self.values)
.into_iter()
.map(|mut v| v.as_box())
.collect(),
std::mem::take(&mut self.validity).map(|x| x.into()),
)
.arced()
}
fn data_type(&self) -> &ArrowDataType {
&self.data_type
}
fn as_any(&self) -> &dyn std::any::Any {
self
}
fn as_mut_any(&mut self) -> &mut dyn std::any::Any {
self
}
fn push_null(&mut self) {
self.push_null()
}
fn shrink_to_fit(&mut self) {
self.shrink_to_fit()
}
fn reserve(&mut self, additional: usize) {
self.reserve(additional)
}
}