use crate::{
bitmap::Bitmap,
datatypes::{DataType, Field},
error::Error,
offset::OffsetsBuffer,
};
use super::{new_empty_array, specification::try_check_offsets_bounds, Array};
mod ffi;
mod fmt;
mod iterator;
pub use iterator::*;
/// An array whose logical type is [`DataType::Map`], stored as `i32` offsets into a
/// single child array (`field`).
#[derive(Clone)]
pub struct MapArray {
/// Logical type of the array; `try_new` requires it to resolve to `DataType::Map`.
data_type: DataType,
/// Offsets delimiting, for each slot, the range of `field` that belongs to it.
offsets: OffsetsBuffer<i32>,
/// Child array holding the entries of every slot; `try_new` requires its type to be
/// the two-field `Struct` declared by `data_type`.
field: Box<dyn Array>,
/// Optional validity bitmap; when present its length equals the array's length.
validity: Option<Bitmap>,
}
impl MapArray {
    /// Builds a [`MapArray`] after validating its components.
    ///
    /// # Errors
    /// Returns an error, checked in this order, when:
    /// * `try_check_offsets_bounds` rejects `offsets` against `field.len()`;
    /// * the logical type of `data_type` is not [`DataType::Map`];
    /// * the map's inner field is not a [`DataType::Struct`] with exactly 2 fields;
    /// * `field.data_type()` differs from that inner `Struct` type;
    /// * `validity` is present and its length differs from `offsets.len()`.
    pub fn try_new(
        data_type: DataType,
        offsets: OffsetsBuffer<i32>,
        field: Box<dyn Array>,
        validity: Option<Bitmap>,
    ) -> Result<Self, Error> {
        try_check_offsets_bounds(&offsets, field.len())?;

        // The type every entry of the child array is expected to have.
        let expected = Self::try_get_field(&data_type)?.data_type();
        match expected {
            DataType::Struct(children) if children.len() == 2 => {}
            DataType::Struct(_) => {
                return Err(Error::InvalidArgumentError(
                    "MapArray's inner `Struct` must have 2 fields (keys and maps)".to_string(),
                ))
            }
            _ => {
                return Err(Error::InvalidArgumentError(
                    "MapArray expects `DataType::Struct` as its inner logical type".to_string(),
                ))
            }
        }

        if field.data_type() != expected {
            return Err(Error::InvalidArgumentError(
                "MapArray expects `field.data_type` to match its inner DataType".to_string(),
            ));
        }

        if matches!(&validity, Some(bitmap) if bitmap.len() != offsets.len()) {
            return Err(Error::oos(
                "validity mask length must match the number of values",
            ));
        }

        Ok(Self {
            data_type,
            offsets,
            field,
            validity,
        })
    }

    /// Builds a [`MapArray`], panicking where [`MapArray::try_new`] would return an error.
    ///
    /// # Panics
    /// Panics under exactly the conditions listed in [`MapArray::try_new`]'s `# Errors`.
    pub fn new(
        data_type: DataType,
        offsets: OffsetsBuffer<i32>,
        field: Box<dyn Array>,
        validity: Option<Bitmap>,
    ) -> Self {
        Self::try_new(data_type, offsets, field, validity).unwrap()
    }

    /// Builds a [`MapArray`] of `length` slots with all-zero offsets, an empty child
    /// array and a zeroed validity bitmap.
    ///
    /// # Panics
    /// Panics if the logical type of `data_type` is not [`DataType::Map`].
    pub fn new_null(data_type: DataType, length: usize) -> Self {
        let child_type = Self::get_field(&data_type).data_type().clone();
        let field = new_empty_array(child_type);
        // `length` slots need `length + 1` offsets.
        let offsets: OffsetsBuffer<i32> = vec![0i32; 1 + length].try_into().unwrap();
        let validity = Bitmap::new_zeroed(length);
        Self::new(data_type, offsets, field, Some(validity))
    }

    /// Builds a [`MapArray`] from default offsets, an empty child array and no validity.
    ///
    /// # Panics
    /// Panics if the logical type of `data_type` is not [`DataType::Map`].
    pub fn new_empty(data_type: DataType) -> Self {
        let child_type = Self::get_field(&data_type).data_type().clone();
        Self::new(
            data_type,
            OffsetsBuffer::default(),
            new_empty_array(child_type),
            None,
        )
    }

    /// Consumes the array and returns it with its validity replaced by `validity`.
    ///
    /// # Panics
    /// Panics if `validity` is `Some` and its length differs from the array's length.
    #[must_use]
    pub fn with_validity(mut self, validity: Option<Bitmap>) -> Self {
        self.set_validity(validity);
        self
    }

    /// Replaces the validity of this array in place.
    ///
    /// # Panics
    /// Panics if `validity` is `Some` and its length differs from the array's length.
    pub fn set_validity(&mut self, validity: Option<Bitmap>) {
        if let Some(bitmap) = validity.as_ref() {
            if bitmap.len() != self.len() {
                panic!("validity's length must be equal to the array's length")
            }
        }
        self.validity = validity;
    }

    /// Moves this array into a `Box<dyn Array>`.
    pub fn boxed(self) -> Box<dyn Array> {
        Box::new(self)
    }

    /// Moves this array into an `Arc<dyn Array>`.
    pub fn arced(self) -> std::sync::Arc<dyn Array> {
        std::sync::Arc::new(self)
    }
}
impl MapArray {
pub fn slice(&self, offset: usize, length: usize) -> Self {
assert!(
offset + length <= self.len(),
"the offset of the new Buffer cannot exceed the existing length"
);
unsafe { self.slice_unchecked(offset, length) }
}
pub unsafe fn slice_unchecked(&self, offset: usize, length: usize) -> Self {
let offsets = self.offsets.clone().slice_unchecked(offset, length + 1);
let validity = self
.validity
.clone()
.map(|bitmap| bitmap.slice_unchecked(offset, length))
.and_then(|bitmap| (bitmap.unset_bits() > 0).then(|| bitmap));
Self {
data_type: self.data_type.clone(),
offsets,
field: self.field.clone(),
validity,
}
}
pub(crate) fn try_get_field(data_type: &DataType) -> Result<&Field, Error> {
if let DataType::Map(field, _) = data_type.to_logical_type() {
Ok(field.as_ref())
} else {
Err(Error::oos(
"The data_type's logical type must be DataType::Map",
))
}
}
pub(crate) fn get_field(data_type: &DataType) -> &Field {
Self::try_get_field(data_type).unwrap()
}
}
impl MapArray {
    /// Returns the length of this array, as reported by its offsets buffer.
    #[inline]
    pub fn len(&self) -> usize {
        self.offsets.len()
    }

    /// Returns the offsets that delimit each slot within the child array.
    #[inline]
    pub fn offsets(&self) -> &OffsetsBuffer<i32> {
        &self.offsets
    }

    /// Returns the child array holding the entries of every slot.
    #[inline]
    pub fn field(&self) -> &Box<dyn Array> {
        &self.field
    }

    /// Returns the portion of the child array that belongs to slot `i`.
    ///
    /// # Panics
    /// Panics if `i >= self.len()`.
    #[inline]
    pub fn value(&self, i: usize) -> Box<dyn Array> {
        assert!(i < self.len());
        // SAFETY: `i` was just checked to be within bounds.
        unsafe { self.value_unchecked(i) }
    }

    /// Returns the portion of the child array that belongs to slot `i`, without
    /// checking bounds.
    ///
    /// # Safety
    /// The caller must ensure that `i < self.len()`.
    #[inline]
    pub unsafe fn value_unchecked(&self, i: usize) -> Box<dyn Array> {
        let (start, end) = self.offsets.start_end_unchecked(i);
        self.field.slice_unchecked(start, end - start)
    }
}
/// [`Array`] implementation that forwards to the inherent methods and fields of
/// [`MapArray`], boxing results where the trait requires a trait object.
impl Array for MapArray {
    #[inline]
    fn as_any(&self) -> &dyn std::any::Any {
        self
    }

    #[inline]
    fn as_any_mut(&mut self) -> &mut dyn std::any::Any {
        self
    }

    // Forwards to the inherent `MapArray::len`.
    #[inline]
    fn len(&self) -> usize {
        self.len()
    }

    #[inline]
    fn data_type(&self) -> &DataType {
        &self.data_type
    }

    #[inline]
    fn validity(&self) -> Option<&Bitmap> {
        self.validity.as_ref()
    }

    // Inherent `slice` returns `MapArray`; box it for the trait.
    fn slice(&self, offset: usize, length: usize) -> Box<dyn Array> {
        self.slice(offset, length).boxed()
    }

    // Same contract as the inherent `slice_unchecked`: the caller guarantees the bounds.
    unsafe fn slice_unchecked(&self, offset: usize, length: usize) -> Box<dyn Array> {
        self.slice_unchecked(offset, length).boxed()
    }

    // Clones first because the inherent `with_validity` consumes the array.
    fn with_validity(&self, validity: Option<Bitmap>) -> Box<dyn Array> {
        self.clone().with_validity(validity).boxed()
    }

    fn to_boxed(&self) -> Box<dyn Array> {
        self.clone().boxed()
    }
}