// polars_core/chunked_array/ops/append.rs
use polars_error::constants::LENGTH_LIMIT_MSG;
use crate::prelude::*;
use crate::series::IsSorted;
/// Adds clones of the arrays in `other` to `chunks`.
///
/// `len` is the caller-supplied length of the data currently represented by `chunks`.
/// When `chunks` holds exactly one array and `len` is zero, the current contents are
/// replaced wholesale by a clone of `other` (zero-length arrays in `other` included).
/// In every other case only the arrays of `other` whose length is non-zero are cloned
/// and pushed onto the end of `chunks`.
pub(crate) fn new_chunks(chunks: &mut Vec<ArrayRef>, other: &[ArrayRef], len: usize) {
    let replaces_single_empty_chunk = chunks.len() == 1 && len == 0;
    if replaces_single_empty_chunk {
        other.clone_into(chunks);
        return;
    }

    // Zero-length arrays are skipped; only the arrays that survive the filter are cloned.
    chunks.extend(other.iter().filter(|arr| arr.len() > 0).cloned());
}
/// Owned counterpart of `new_chunks`: moves the arrays of `other` into `chunks`.
///
/// `len` is the caller-supplied length of the data currently represented by `chunks`.
/// When `chunks` holds exactly one array and `len` is zero, `chunks` is overwritten with
/// `other` as-is. Otherwise the arrays of `other` with a non-zero length are pushed onto
/// `chunks`, and zero-length arrays are dropped.
pub(crate) fn new_chunks_owned(chunks: &mut Vec<ArrayRef>, other: Vec<ArrayRef>, len: usize) {
    if len != 0 || chunks.len() != 1 {
        // Reserve for the worst case in which no incoming array is filtered out.
        chunks.reserve(other.len());
        for arr in other {
            if arr.len() > 0 {
                chunks.push(arr);
            }
        }
        return;
    }

    *chunks = other;
}
/// Works out which sorted flag `ca` should carry once `other` has been appended to it and
/// stores that flag on `ca` via `set_sorted_flag`.
///
/// As the name says, this is meant to run *before* the append is carried out: every check
/// below reads the current `len()`, `null_count()` and values of `ca`.
///
/// The outer `match` dispatches on whether each side holds at least one non-null value
/// (`null_count() != len()`); an empty array counts as having none.
pub(super) fn update_sorted_flag_before_append<T>(ca: &mut ChunkedArray<T>, other: &ChunkedArray<T>)
where
T: PolarsDataType,
for<'a> T::Physical<'a>: TotalOrd,
{
// Tuple layout: (`ca` has a non-null value, `other` has a non-null value).
let sorted_flag = match (
ca.null_count() != ca.len(),
other.null_count() != other.len(),
) {
// Neither side has a non-null value: the result is flagged ascending.
(false, false) => IsSorted::Ascending,
// Only `other` has non-null values.
(false, true) => {
if
// `ca` is empty, or
ca.is_empty()
// `other` is flagged sorted and its last element is non-null. The `&&` short-circuit
// means `last_non_null` is only queried once the flag check has passed; the `unwrap`
// presumably cannot fail because this arm implies `other` has a non-null value.
|| (
other.is_sorted_any() && 1 + other.last_non_null().unwrap() == other.len()
)
{
other.is_sorted_flag()
} else {
IsSorted::Not
}
},
// Only `ca` has non-null values (mirror image of the arm above).
(true, false) => {
if
// `other` is empty, or
other.is_empty()
// `ca` is flagged sorted and its first element is non-null.
|| (
ca.is_sorted_any() && ca.first_non_null().unwrap() == 0
)
{
ca.is_sorted_flag()
} else {
IsSorted::Not
}
},
// Both sides have non-null values.
(true, true) => {
// Give up unless each side is either flagged sorted or has length 1, and
// additionally at least one side has exactly one non-null value or both sides
// carry the same flag.
if !(ca.is_sorted_any() || ca.len() == 1)
|| !(other.is_sorted_any() || other.len() == 1)
|| !(
ca.len() - ca.null_count() == 1
|| other.len() - other.null_count() == 1
|| ca.is_sorted_flag() == other.is_sorted_flag()
)
{
IsSorted::Not
} else {
// Indices of the two values that become neighbours at the seam (ignoring nulls).
let l_idx = ca.last_non_null().unwrap();
let r_idx = other.first_non_null().unwrap();
// Null placement: `ca` must end with a non-null, `other` must start with a
// non-null, and it must not be the case that `ca` starts with a null while
// `other` ends with one (nulls on both outer ends).
let null_pos_check =
(1 + l_idx == ca.len())
&& (r_idx == 0)
&& !(ca.first_non_null().unwrap() != 0 && 1 + other.last_non_null().unwrap() != other.len());
if !null_pos_check {
IsSorted::Not
} else {
// The initial value is overwritten in every arm of the `match` below, hence the lint
// allowance.
#[allow(unused_assignments)]
let mut out = IsSorted::Not;
// SAFETY: NOTE(review) - `l_idx` / `r_idx` were returned by `last_non_null` /
// `first_non_null` on these same arrays, so they are presumably in bounds; confirm
// against the contract of `value_unchecked`.
let l_val = unsafe { ca.value_unchecked(l_idx) };
let r_val = unsafe { other.value_unchecked(r_idx) };
// Tuple layout: (`ca` has exactly one non-null value, `other` has exactly one).
match (
ca.len() - ca.null_count() == 1,
other.len() - other.null_count() == 1,
) {
(true, true) => {
// One value on each side: the direction is decided by those two values alone.
// `tot_le` yields `true` -> index 1 -> `Ascending`, `false` -> index 0 -> `Descending`.
out = [IsSorted::Descending, IsSorted::Ascending]
[l_val.tot_le(&r_val) as usize];
// The values are dropped explicitly before `ca` is used mutably below
// (`l_val` was obtained from `ca`).
drop(l_val);
drop(r_val);
ca.set_sorted_flag(out);
return;
},
// `ca` has a single non-null value: follow the direction of `other`.
(true, false) => out = other.is_sorted_flag(),
// Otherwise follow the direction of `ca`.
_ => out = ca.is_sorted_flag(),
}
// Checked in debug builds only: a direction must have been chosen by now.
debug_assert!(!matches!(out, IsSorted::Not));
// The two values at the seam have to respect the chosen direction.
let check = if matches!(out, IsSorted::Ascending) {
l_val.tot_le(&r_val)
} else {
l_val.tot_ge(&r_val)
};
if !check {
out = IsSorted::Not
}
out
}
}
},
};
ca.set_sorted_flag(sorted_flag);
}
impl<T> ChunkedArray<T>
where
    T: PolarsDataType<IsNested = FalseT, IsObject = FalseT>,
    for<'a> T::Physical<'a>: TotalOrd,
{
    /// Appends the contents of `other` to `self`.
    ///
    /// Clones `other` and forwards to [`Self::append_owned`].
    ///
    /// # Errors
    ///
    /// Propagates any error returned by [`Self::append_owned`].
    pub fn append(&mut self, other: &Self) -> PolarsResult<()> {
        self.append_owned(other.clone())
    }

    /// Appends `other` to `self`, taking ownership of `other`'s chunks.
    ///
    /// The sorted flag of `self` is recomputed from both arrays, then the length, the null
    /// count and the chunk list are updated.
    ///
    /// # Errors
    ///
    /// Returns a `ComputeError` carrying `LENGTH_LIMIT_MSG` when the combined length
    /// overflows the length counter. In that case `self` is left untouched.
    pub fn append_owned(&mut self, mut other: Self) -> PolarsResult<()> {
        // Run the only fallible step first so that a failed append does not leave `self`
        // with a modified sorted flag.
        let combined_length = self
            .length
            .checked_add(other.length)
            .ok_or_else(|| polars_err!(ComputeError: LENGTH_LIMIT_MSG))?;

        // Has to see the pre-append state of `self`, so it runs before any field is updated.
        update_sorted_flag_before_append::<T>(self, &other);

        // Length before the append; `new_chunks_owned` needs it to decide whether the
        // existing chunk list is replaced or extended.
        let len = self.len();
        self.length = combined_length;
        self.null_count += other.null_count;
        new_chunks_owned(&mut self.chunks, std::mem::take(&mut other.chunks), len);
        Ok(())
    }
}
#[doc(hidden)]
impl ListChunked {
    /// Appends the contents of `other` to `self`.
    ///
    /// Clones `other` and forwards to [`Self::append_owned`].
    ///
    /// # Errors
    ///
    /// Propagates any error returned by [`Self::append_owned`].
    pub fn append(&mut self, other: &Self) -> PolarsResult<()> {
        self.append_owned(other.clone())
    }

    /// Appends `other` to `self`, taking ownership of `other`'s chunks.
    ///
    /// The field of `self` is rebuilt with the dtype produced by `merge_dtypes`, the sorted
    /// flag is reset to `IsSorted::Not`, and the fast-explode marker is cleared when
    /// `other` does not carry it.
    ///
    /// # Errors
    ///
    /// Returns the error from `merge_dtypes` when the dtypes cannot be merged, or a
    /// `ComputeError` carrying `LENGTH_LIMIT_MSG` when the combined length overflows the
    /// length counter. In both cases `self` is left untouched.
    pub fn append_owned(&mut self, mut other: Self) -> PolarsResult<()> {
        // Both fallible steps run before any mutation (dtype merge first, as before), so an
        // error can no longer leave `self` with a replaced field but unchanged data.
        let dtype = merge_dtypes(self.dtype(), other.dtype())?;
        let combined_length = self
            .length
            .checked_add(other.length)
            .ok_or_else(|| polars_err!(ComputeError: LENGTH_LIMIT_MSG))?;

        self.field = Arc::new(Field::new(self.name().clone(), dtype));

        // Length before the append; `new_chunks_owned` needs it to decide whether the
        // existing chunk list is replaced or extended.
        let len = self.len();
        self.length = combined_length;
        self.null_count += other.null_count;
        self.set_sorted_flag(IsSorted::Not);
        if !other.get_fast_explode_list() {
            self.unset_fast_explode_list();
        }

        new_chunks_owned(&mut self.chunks, std::mem::take(&mut other.chunks), len);
        Ok(())
    }
}
#[cfg(feature = "dtype-array")]
#[doc(hidden)]
impl ArrayChunked {
    /// Appends the contents of `other` to `self`.
    ///
    /// Clones `other` and forwards to [`Self::append_owned`].
    ///
    /// # Errors
    ///
    /// Propagates any error returned by [`Self::append_owned`].
    pub fn append(&mut self, other: &Self) -> PolarsResult<()> {
        self.append_owned(other.clone())
    }

    /// Appends `other` to `self`, taking ownership of `other`'s chunks.
    ///
    /// The field of `self` is rebuilt with the dtype produced by `merge_dtypes` and the
    /// sorted flag is reset to `IsSorted::Not`.
    ///
    /// # Errors
    ///
    /// Returns the error from `merge_dtypes` when the dtypes cannot be merged, or a
    /// `ComputeError` carrying `LENGTH_LIMIT_MSG` when the combined length overflows the
    /// length counter. In both cases `self` is left untouched.
    pub fn append_owned(&mut self, mut other: Self) -> PolarsResult<()> {
        // Both fallible steps run before any mutation (dtype merge first, as before), so an
        // error can no longer leave `self` with a replaced field but unchanged data.
        let dtype = merge_dtypes(self.dtype(), other.dtype())?;
        let combined_length = self
            .length
            .checked_add(other.length)
            .ok_or_else(|| polars_err!(ComputeError: LENGTH_LIMIT_MSG))?;

        self.field = Arc::new(Field::new(self.name().clone(), dtype));

        // Length before the append; `new_chunks_owned` needs it to decide whether the
        // existing chunk list is replaced or extended.
        let len = self.len();
        self.length = combined_length;
        self.null_count += other.null_count;
        self.set_sorted_flag(IsSorted::Not);

        new_chunks_owned(&mut self.chunks, std::mem::take(&mut other.chunks), len);
        Ok(())
    }
}
#[cfg(feature = "dtype-struct")]
#[doc(hidden)]
impl StructChunked {
    /// Appends the contents of `other` to `self`.
    ///
    /// Clones `other` and forwards to [`Self::append_owned`].
    ///
    /// # Errors
    ///
    /// Propagates any error returned by [`Self::append_owned`].
    pub fn append(&mut self, other: &Self) -> PolarsResult<()> {
        self.append_owned(other.clone())
    }

    /// Appends `other` to `self`, taking ownership of `other`'s chunks.
    ///
    /// The field of `self` is rebuilt with the dtype produced by `merge_dtypes` and the
    /// sorted flag is reset to `IsSorted::Not`.
    ///
    /// # Errors
    ///
    /// Returns the error from `merge_dtypes` when the dtypes cannot be merged, or a
    /// `ComputeError` carrying `LENGTH_LIMIT_MSG` when the combined length overflows the
    /// length counter. In both cases `self` is left untouched.
    pub fn append_owned(&mut self, mut other: Self) -> PolarsResult<()> {
        // Both fallible steps run before any mutation (dtype merge first, as before), so an
        // error can no longer leave `self` with a replaced field but unchanged data.
        let dtype = merge_dtypes(self.dtype(), other.dtype())?;
        let combined_length = self
            .length
            .checked_add(other.length)
            .ok_or_else(|| polars_err!(ComputeError: LENGTH_LIMIT_MSG))?;

        self.field = Arc::new(Field::new(self.name().clone(), dtype));

        // Length before the append; `new_chunks_owned` needs it to decide whether the
        // existing chunk list is replaced or extended.
        let len = self.len();
        self.length = combined_length;
        self.null_count += other.null_count;
        self.set_sorted_flag(IsSorted::Not);

        new_chunks_owned(&mut self.chunks, std::mem::take(&mut other.chunks), len);
        Ok(())
    }
}
#[cfg(feature = "object")]
#[doc(hidden)]
impl<T: PolarsObject> ObjectChunked<T> {
    /// Appends the contents of `other` to `self` by cloning `other` and handing the clone
    /// to [`Self::append_owned`].
    pub fn append(&mut self, other: &Self) -> PolarsResult<()> {
        let owned = other.clone();
        self.append_owned(owned)
    }

    /// Appends `other` to `self`, taking ownership of `other`'s chunks.
    ///
    /// Updates the length and null count, resets the sorted flag to `IsSorted::Not` and
    /// merges the chunk lists.
    ///
    /// # Errors
    ///
    /// Returns a `ComputeError` carrying `LENGTH_LIMIT_MSG` when the combined length
    /// overflows the length counter.
    pub fn append_owned(&mut self, mut other: Self) -> PolarsResult<()> {
        // Length before the append; `new_chunks_owned` uses it to decide between replacing
        // and extending the existing chunk list.
        let previous_len = self.len();

        let total = match self.length.checked_add(other.length) {
            Some(total) => total,
            None => return Err(polars_err!(ComputeError: LENGTH_LIMIT_MSG)),
        };
        let incoming = std::mem::take(&mut other.chunks);

        self.length = total;
        self.null_count += other.null_count;
        self.set_sorted_flag(IsSorted::Not);
        new_chunks_owned(&mut self.chunks, incoming, previous_len);
        Ok(())
    }
}