1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60
use super::{Field, Metadata};
#[cfg(feature = "serde_types")]
use serde_derive::{Deserialize, Serialize};
/// An ordered sequence of [`Field`]s with associated [`Metadata`].
///
/// [`Schema`] is an abstration used to read from, and write to, Arrow IPC format,
/// Apache Parquet, and Apache Avro. All these formats have a concept of a schema
/// with fields and metadata.
#[derive(Debug, Clone, PartialEq, Eq, Default)]
#[cfg_attr(feature = "serde_types", derive(Serialize, Deserialize))]
pub struct Schema {
/// The fields composing this schema.
pub fields: Vec<Field>,
/// Optional metadata.
pub metadata: Metadata,
}
impl Schema {
/// Attaches a [`Metadata`] to [`Schema`]
#[inline]
pub fn with_metadata(self, metadata: Metadata) -> Self {
Self {
fields: self.fields,
metadata,
}
}
/// Returns a new [`Schema`] with a subset of all fields whose `predicate`
/// evaluates to true.
pub fn filter<F: Fn(usize, &Field) -> bool>(self, predicate: F) -> Self {
let fields = self
.fields
.into_iter()
.enumerate()
.filter_map(|(index, f)| {
if (predicate)(index, &f) {
Some(f)
} else {
None
}
})
.collect();
Schema {
fields,
metadata: self.metadata,
}
}
}
impl From<Vec<Field>> for Schema {
fn from(fields: Vec<Field>) -> Self {
Self {
fields,
..Default::default()
}
}
}