Struct re_sdk::external::arrow2::array::Utf8Array

source ·
pub struct Utf8Array<O>
where O: Offset,
{ /* private fields */ }
Expand description

A Utf8Array is arrow’s semantic equivalent of an immutable Vec<Option<String>>. Cloning and slicing this struct is O(1).

§Example

use re_arrow2::bitmap::Bitmap;
use re_arrow2::buffer::Buffer;
use re_arrow2::array::Utf8Array;
let array = Utf8Array::<i32>::from([Some("hi"), None, Some("there")]);
assert_eq!(array.value(0), "hi");
assert_eq!(array.iter().collect::<Vec<_>>(), vec![Some("hi"), None, Some("there")]);
assert_eq!(array.values_iter().collect::<Vec<_>>(), vec!["hi", "", "there"]);
// the underlying representation
assert_eq!(array.validity(), Some(&Bitmap::from([true, false, true])));
assert_eq!(array.values(), &Buffer::from(b"hithere".to_vec()));
assert_eq!(array.offsets().buffer(), &Buffer::from(vec![0, 2, 2, 2 + 5]));

§Generic parameter

The generic parameter Offset can only be i32 or i64, and it trades off maximum array length against memory usage:

  • the sum of lengths of all elements cannot exceed Offset::MAX
  • the total size of the underlying data is array.len() * size_of::<Offset>() + sum of lengths of all elements

§Safety

The following invariants hold:

  • Two consecutive offsets, cast (as) to usize, delimit a valid slice of values.
  • A slice of values taken between two consecutive offsets is valid utf8.
  • len is equal to validity.len(), when defined.

Implementations§

source§

impl<O> Utf8Array<O>
where O: Offset,

source

pub fn try_new( data_type: DataType, offsets: OffsetsBuffer<O>, values: Buffer<u8>, validity: Option<Bitmap> ) -> Result<Utf8Array<O>, Error>

Returns a Utf8Array created from its internal representation.

§Errors

This function returns an error iff:

  • The last offset is not equal to the values’ length.
  • the validity’s length is not equal to offsets.len().
  • The data_type’s crate::datatypes::PhysicalType is not equal to either Utf8 or LargeUtf8.
  • The values between two consecutive offsets are not valid utf8
§Implementation

This function is O(N) - checking utf8 is O(N)

source

pub fn from_slice<T, P>(slice: P) -> Utf8Array<O>
where T: AsRef<str>, P: AsRef<[T]>,

Returns a Utf8Array from a slice of &str.

A convenience method that uses Self::from_trusted_len_values_iter.

source

pub fn from<T, P>(slice: P) -> Utf8Array<O>
where T: AsRef<str>, P: AsRef<[Option<T>]>,

Returns a new Utf8Array from a slice of Option<&str>.

A convenience method that uses Self::from_trusted_len_iter.

source

pub fn iter( &self ) -> ZipValidity<&str, ArrayValuesIter<'_, Utf8Array<O>>, BitmapIter<'_>>

Returns an iterator of Option<&str>

source

pub fn values_iter(&self) -> ArrayValuesIter<'_, Utf8Array<O>>

Returns an iterator of &str

source

pub fn len(&self) -> usize

Returns the length of this array

source

pub fn value(&self, i: usize) -> &str

Returns the value of the element at index i, ignoring the array’s validity.

§Panic

This function panics iff i >= self.len().

source

pub unsafe fn value_unchecked(&self, i: usize) -> &str

Returns the value of the element at index i, ignoring the array’s validity.

§Safety

This function is safe iff i < self.len().

source

pub fn get(&self, i: usize) -> Option<&str>

Returns the element at index i or None if it is null

§Panics

iff i >= self.len()

source

pub fn data_type(&self) -> &DataType

Returns the DataType of this array.

source

pub fn values(&self) -> &Buffer<u8>

Returns the values of this Utf8Array.

source

pub fn offsets(&self) -> &OffsetsBuffer<O>

Returns the offsets of this Utf8Array.

source

pub fn validity(&self) -> Option<&Bitmap>

The optional validity.

source

pub fn slice(&mut self, offset: usize, length: usize)

Slices this Utf8Array.

§Implementation

This function is O(1).

§Panics

iff offset + length > self.len().

source

pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize)

Slices this Utf8Array.

§Implementation

This function is O(1)

§Safety

The caller must ensure that offset + length <= self.len().

source

pub fn sliced(self, offset: usize, length: usize) -> Utf8Array<O>

Returns this array sliced.

§Implementation

This function is O(1).

§Panics

iff offset + length > self.len().

source

pub unsafe fn sliced_unchecked( self, offset: usize, length: usize ) -> Utf8Array<O>

Returns this array sliced.

§Implementation

This function is O(1).

§Safety

The caller must ensure that offset + length <= self.len().

source

pub fn with_validity(self, validity: Option<Bitmap>) -> Utf8Array<O>

Returns this array with a new validity.

§Panic

Panics iff validity.len() != self.len().

source

pub fn set_validity(&mut self, validity: Option<Bitmap>)

Sets the validity of this array.

§Panics

This function panics iff validity.len() != self.len().

source

pub fn boxed(self) -> Box<dyn Array>

Boxes this array into a Box<dyn Array>.

source

pub fn arced(self) -> Arc<dyn Array>

Arcs this array into a std::sync::Arc<dyn Array>.

source

pub fn into_inner( self ) -> (DataType, OffsetsBuffer<O>, Buffer<u8>, Option<Bitmap>)

Returns its internal representation

source

pub fn into_mut(self) -> Either<Utf8Array<O>, MutableUtf8Array<O>>

Try to convert this Utf8Array to a MutableUtf8Array

source

pub fn new_empty(data_type: DataType) -> Utf8Array<O>

Returns a new empty Utf8Array.

The array is guaranteed to have no elements nor validity.

source

pub fn new_null(data_type: DataType, length: usize) -> Utf8Array<O>

Returns a new Utf8Array whose slots are all null / None.

source

pub fn default_data_type() -> DataType

Returns a default DataType of this array, which depends on the generic parameter O: DataType::Utf8 or DataType::LargeUtf8

source

pub unsafe fn try_new_unchecked( data_type: DataType, offsets: OffsetsBuffer<O>, values: Buffer<u8>, validity: Option<Bitmap> ) -> Result<Utf8Array<O>, Error>

Creates a new Utf8Array without checking for offsets monotonicity nor utf8-validity

§Errors

This function returns an error iff:

  • The last offset is not equal to the values’ length.
  • the validity’s length is not equal to offsets.len().
  • The data_type’s crate::datatypes::PhysicalType is not equal to either Utf8 or LargeUtf8.
§Safety

This function is unsound iff:

  • The values between two consecutive offsets are not valid utf8
§Implementation

This function is O(1)

source

pub fn new( data_type: DataType, offsets: OffsetsBuffer<O>, values: Buffer<u8>, validity: Option<Bitmap> ) -> Utf8Array<O>

Creates a new Utf8Array.

§Panics

This function panics iff:

  • The last offset is not equal to the values’ length.
  • the validity’s length is not equal to offsets.len().
  • The data_type’s crate::datatypes::PhysicalType is not equal to either Utf8 or LargeUtf8.
  • The values between two consecutive offsets are not valid utf8
§Implementation

This function is O(N) - checking utf8 is O(N)

source

pub unsafe fn new_unchecked( data_type: DataType, offsets: OffsetsBuffer<O>, values: Buffer<u8>, validity: Option<Bitmap> ) -> Utf8Array<O>

Creates a new Utf8Array without checking for offsets monotonicity nor utf8-validity.

§Panics

This function panics iff:

  • The last offset is not equal to the values’ length.
  • the validity’s length is not equal to offsets.len().
  • The data_type’s crate::datatypes::PhysicalType is not equal to either Utf8 or LargeUtf8.
§Safety

This function is unsound iff:

  • the offsets are not monotonically increasing
  • The values between two consecutive offsets are not valid utf8
§Implementation

This function is O(1)

source

pub fn from_trusted_len_values_iter<T, I>(iterator: I) -> Utf8Array<O>
where T: AsRef<str>, I: TrustedLen<Item = T>,

Returns a (non-null) Utf8Array created from a TrustedLen of &str.

§Implementation

This function is O(N)

source

pub fn from_iter_values<T, I>(iterator: I) -> Utf8Array<O>
where T: AsRef<str>, I: Iterator<Item = T>,

Creates a new Utf8Array from an Iterator of &str.

source

pub unsafe fn from_trusted_len_iter_unchecked<I, P>(iterator: I) -> Utf8Array<O>
where P: AsRef<str>, I: Iterator<Item = Option<P>>,

Creates a Utf8Array from an iterator of trusted length.

§Safety

The iterator must be TrustedLen. I.e. that size_hint().1 correctly reports its length.

source

pub fn from_trusted_len_iter<I, P>(iterator: I) -> Utf8Array<O>
where P: AsRef<str>, I: TrustedLen<Item = Option<P>>,

Creates a Utf8Array from an iterator of trusted length.

source

pub unsafe fn try_from_trusted_len_iter_unchecked<E, I, P>( iterator: I ) -> Result<Utf8Array<O>, E>
where P: AsRef<str>, I: IntoIterator<Item = Result<Option<P>, E>>,

Creates a Utf8Array from a fallible iterator of trusted length.

§Safety

The iterator must be TrustedLen. I.e. that size_hint().1 correctly reports its length.

source

pub fn try_from_trusted_len_iter<E, I, P>(iter: I) -> Result<Utf8Array<O>, E>
where P: AsRef<str>, I: TrustedLen<Item = Result<Option<P>, E>>,

Creates a Utf8Array from a fallible iterator of trusted length.

source

pub fn apply_validity<F>(&mut self, f: F)
where F: FnOnce(Bitmap) -> Bitmap,

Applies a function f to the validity of this array.

This is an API to leverage clone-on-write

§Panics

This function panics if the function f modifies the length of the Bitmap.

Trait Implementations§

source§

impl<O> Array for Utf8Array<O>
where O: Offset,

source§

fn as_any(&self) -> &(dyn Any + 'static)

Converts itself to a reference of Any, which enables downcasting to concrete types.
source§

fn as_any_mut(&mut self) -> &mut (dyn Any + 'static)

Converts itself to a mutable reference of Any, which enables mutable downcasting to concrete types.
source§

fn len(&self) -> usize

The length of the Array. Every array has a length corresponding to the number of elements (slots).
source§

fn data_type(&self) -> &DataType

The DataType of the Array. In combination with Array::as_any, this can be used to downcast trait objects (dyn Array) to concrete arrays.
source§

fn slice(&mut self, offset: usize, length: usize)

Slices this Array. Read more
source§

unsafe fn slice_unchecked(&mut self, offset: usize, length: usize)

Slices the Array. Read more
source§

fn to_boxed(&self) -> Box<dyn Array>

Clone a &dyn Array to an owned Box<dyn Array>.
source§

fn validity(&self) -> Option<&Bitmap>

The validity of the Array: every array has an optional Bitmap that, when available specifies whether the array slot is valid or not (null). When the validity is None, all slots are valid.
source§

fn with_validity(&self, validity: Option<Bitmap>) -> Box<dyn Array>

Clones this Array with a newly assigned bitmap. Read more
source§

fn is_empty(&self) -> bool

whether the array is empty
source§

fn null_count(&self) -> usize

The number of null slots on this Array. Read more
source§

fn is_null(&self, i: usize) -> bool

Returns whether slot i is null. Read more
source§

unsafe fn is_null_unchecked(&self, i: usize) -> bool

Returns whether slot i is null. Read more
source§

fn is_valid(&self, i: usize) -> bool

Returns whether slot i is valid. Read more
source§

fn sliced(&self, offset: usize, length: usize) -> Box<dyn Array>

Returns a slice of this Array. Read more
source§

unsafe fn sliced_unchecked( &self, offset: usize, length: usize ) -> Box<dyn Array>

Returns a slice of this Array. Read more
source§

impl<O> Clone for Utf8Array<O>
where O: Clone + Offset,

source§

fn clone(&self) -> Utf8Array<O>

Returns a copy of the value. Read more
1.0.0 · source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more
source§

impl<O> Debug for Utf8Array<O>
where O: Offset,

source§

fn fmt(&self, f: &mut Formatter<'_>) -> Result<(), Error>

Formats the value using the given formatter. Read more
source§

impl<O> Default for Utf8Array<O>
where O: Offset,

source§

fn default() -> Utf8Array<O>

Returns the “default value” for a type. Read more
source§

impl<'a, O> From<GrowableUtf8<'a, O>> for Utf8Array<O>
where O: Offset,

source§

fn from(val: GrowableUtf8<'a, O>) -> Utf8Array<O>

Converts to this type from the input type.
source§

impl<O> From<MutableUtf8Array<O>> for Utf8Array<O>
where O: Offset,

source§

fn from(other: MutableUtf8Array<O>) -> Utf8Array<O>

Converts to this type from the input type.
source§

impl<O> From<MutableUtf8ValuesArray<O>> for Utf8Array<O>
where O: Offset,

source§

fn from(other: MutableUtf8ValuesArray<O>) -> Utf8Array<O>

Converts to this type from the input type.
source§

impl<O, P> FromIterator<Option<P>> for Utf8Array<O>
where O: Offset, P: AsRef<str>,

source§

fn from_iter<I>(iter: I) -> Utf8Array<O>
where I: IntoIterator<Item = Option<P>>,

Creates a value from an iterator. Read more
source§

impl<O> GenericBinaryArray<O> for Utf8Array<O>
where O: Offset,

source§

fn values(&self) -> &[u8]

The values of the array
source§

fn offsets(&self) -> &[O]

The offsets of the array
source§

impl<'a, O> IntoIterator for &'a Utf8Array<O>
where O: Offset,

§

type Item = Option<&'a str>

The type of the elements being iterated over.
§

type IntoIter = ZipValidity<&'a str, ArrayValuesIter<'a, Utf8Array<O>>, BitmapIter<'a>>

Which kind of iterator are we turning this into?
source§

fn into_iter(self) -> <&'a Utf8Array<O> as IntoIterator>::IntoIter

Creates an iterator from a value. Read more
source§

impl<O> PartialEq<&(dyn Array + 'static)> for Utf8Array<O>
where O: Offset,

source§

fn eq(&self, other: &&(dyn Array + 'static)) -> bool

This method tests for self and other values to be equal, and is used by ==.
1.0.0 · source§

fn ne(&self, other: &Rhs) -> bool

This method tests for !=. The default implementation is almost always sufficient, and should not be overridden without very good reason.
source§

impl<O> PartialEq<Utf8Array<O>> for &(dyn Array + 'static)
where O: Offset,

source§

fn eq(&self, other: &Utf8Array<O>) -> bool

This method tests for self and other values to be equal, and is used by ==.
1.0.0 · source§

fn ne(&self, other: &Rhs) -> bool

This method tests for !=. The default implementation is almost always sufficient, and should not be overridden without very good reason.
source§

impl<O> PartialEq for Utf8Array<O>
where O: Offset,

source§

fn eq(&self, other: &Utf8Array<O>) -> bool

This method tests for self and other values to be equal, and is used by ==.
1.0.0 · source§

fn ne(&self, other: &Rhs) -> bool

This method tests for !=. The default implementation is almost always sufficient, and should not be overridden without very good reason.

Auto Trait Implementations§

§

impl<O> Freeze for Utf8Array<O>

§

impl<O> RefUnwindSafe for Utf8Array<O>

§

impl<O> Send for Utf8Array<O>

§

impl<O> Sync for Utf8Array<O>

§

impl<O> Unpin for Utf8Array<O>

§

impl<O> UnwindSafe for Utf8Array<O>

Blanket Implementations§

source§

impl<T> Any for T
where T: 'static + ?Sized,

source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
source§

impl<T> Az for T

source§

fn az<Dst>(self) -> Dst
where T: Cast<Dst>,

Casts the value.
source§

impl<T> Borrow<T> for T
where T: ?Sized,

source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
source§

impl<Src, Dst> CastFrom<Src> for Dst
where Src: Cast<Dst>,

source§

fn cast_from(src: Src) -> Dst

Casts the value.
source§

impl<T> CheckedAs for T

source§

fn checked_as<Dst>(self) -> Option<Dst>
where T: CheckedCast<Dst>,

Casts the value.
source§

impl<Src, Dst> CheckedCastFrom<Src> for Dst
where Src: CheckedCast<Dst>,

source§

fn checked_cast_from(src: Src) -> Option<Dst>

Casts the value.
source§

impl<T> DynClone for T
where T: Clone,

source§

fn __clone_box(&self, _: Private) -> *mut ()

source§

impl<T> From<T> for T

source§

fn from(t: T) -> T

Returns the argument unchanged.

source§

impl<T> Instrument for T

source§

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more
source§

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more
source§

impl<T, U> Into<U> for T
where U: From<T>,

source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

source§

impl<T> IntoEither for T

source§

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
source§

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
source§

impl<Src, Dst> LosslessTryInto<Dst> for Src
where Dst: LosslessTryFrom<Src>,

source§

fn lossless_try_into(self) -> Option<Dst>

Performs the conversion.
source§

impl<Src, Dst> LossyInto<Dst> for Src
where Dst: LossyFrom<Src>,

source§

fn lossy_into(self) -> Dst

Performs the conversion.
source§

impl<T> OverflowingAs for T

source§

fn overflowing_as<Dst>(self) -> (Dst, bool)
where T: OverflowingCast<Dst>,

Casts the value.
source§

impl<Src, Dst> OverflowingCastFrom<Src> for Dst
where Src: OverflowingCast<Dst>,

source§

fn overflowing_cast_from(src: Src) -> (Dst, bool)

Casts the value.
source§

impl<T> Pointable for T

source§

const ALIGN: usize = _

The alignment of pointer.
§

type Init = T

The type for initializers.
source§

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes a with the given initializer. Read more
source§

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more
source§

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more
source§

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more
source§

impl<T> Same for T

§

type Output = T

Should always be Self
source§

impl<T> SaturatingAs for T

source§

fn saturating_as<Dst>(self) -> Dst
where T: SaturatingCast<Dst>,

Casts the value.
source§

impl<Src, Dst> SaturatingCastFrom<Src> for Dst
where Src: SaturatingCast<Dst>,

source§

fn saturating_cast_from(src: Src) -> Dst

Casts the value.
source§

impl<T> ToOwned for T
where T: Clone,

§

type Owned = T

The resulting type after obtaining ownership.
source§

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more
source§

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more
source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

§

type Error = Infallible

The type returned in the event of a conversion error.
source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
source§

impl<T> UnwrappedAs for T

source§

fn unwrapped_as<Dst>(self) -> Dst
where T: UnwrappedCast<Dst>,

Casts the value.
source§

impl<Src, Dst> UnwrappedCastFrom<Src> for Dst
where Src: UnwrappedCast<Dst>,

source§

fn unwrapped_cast_from(src: Src) -> Dst

Casts the value.
source§

impl<T> WithSubscriber for T

source§

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more
source§

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more
source§

impl<T> WrappingAs for T

source§

fn wrapping_as<Dst>(self) -> Dst
where T: WrappingCast<Dst>,

Casts the value.
source§

impl<Src, Dst> WrappingCastFrom<Src> for Dst
where Src: WrappingCast<Dst>,

source§

fn wrapping_cast_from(src: Src) -> Dst

Casts the value.