pub struct FileSink<'a, W: AsyncWrite + Send + Unpin> {
pub metadata: AHashMap<String, Option<String>>,
/* private fields */
}
Expand description
Sink that writes array chunks
as a Parquet file.
Any values in the sink’s metadata
field will be written to the file’s footer
when the sink is closed.
§Examples
use futures::SinkExt;
use arrow2::array::{Array, Int32Array};
use arrow2::datatypes::{DataType, Field, Schema};
use arrow2::chunk::Chunk;
use arrow2::io::parquet::write::{Encoding, WriteOptions, CompressionOptions, Version};
let schema = Schema::from(vec![
Field::new("values", DataType::Int32, true),
]);
let encoding = vec![vec![Encoding::Plain]];
let options = WriteOptions {
write_statistics: true,
compression: CompressionOptions::Uncompressed,
version: Version::V2,
data_pagesize_limit: None,
};
let mut buffer = vec![];
let mut sink = FileSink::try_new(
&mut buffer,
schema,
encoding,
options,
)?;
for i in 0..3 {
let values = Int32Array::from(&[Some(i), None]);
let chunk = Chunk::new(vec![values.boxed()]);
sink.feed(chunk).await?;
}
sink.metadata.insert(String::from("key"), Some(String::from("value")));
sink.close().await?;
Fields§
§metadata: AHashMap<String, Option<String>>
Key-value metadata that will be written to the file on close.
Implementations§
source§impl<'a, W> FileSink<'a, W>
impl<'a, W> FileSink<'a, W>
sourcepub fn try_new(
writer: W,
schema: Schema,
encodings: Vec<Vec<Encoding>>,
options: WriteOptions
) -> Result<Self, Error>
pub fn try_new( writer: W, schema: Schema, encodings: Vec<Vec<Encoding>>, options: WriteOptions ) -> Result<Self, Error>
Create a new sink that writes arrays to the provided writer
.
§Error
Iff
- the Arrow schema can’t be converted to a valid Parquet schema.
- the length of the encodings is different from the number of fields in schema
sourcepub fn parquet_schema(&self) -> &SchemaDescriptor
pub fn parquet_schema(&self) -> &SchemaDescriptor
The Parquet SchemaDescriptor
for the file.
sourcepub fn options(&self) -> &WriteOptions
pub fn options(&self) -> &WriteOptions
The write options for the file.
Trait Implementations§
source§impl<'a, W> Sink<Chunk<Box<dyn Array>>> for FileSink<'a, W>
impl<'a, W> Sink<Chunk<Box<dyn Array>>> for FileSink<'a, W>
source§fn start_send(
self: Pin<&mut Self>,
item: Chunk<Box<dyn Array>>
) -> Result<(), Self::Error>
fn start_send( self: Pin<&mut Self>, item: Chunk<Box<dyn Array>> ) -> Result<(), Self::Error>
Begin the process of sending a value to the sink.
Each call to this function must be preceded by a successful call to
poll_ready
which returned Poll::Ready(Ok(()))
. Read moresource§fn poll_ready(
self: Pin<&mut Self>,
cx: &mut Context<'_>
) -> Poll<Result<(), Self::Error>>
fn poll_ready( self: Pin<&mut Self>, cx: &mut Context<'_> ) -> Poll<Result<(), Self::Error>>
Attempts to prepare the
Sink
to receive a value. Read moreAuto Trait Implementations§
impl<'a, W> Freeze for FileSink<'a, W>where
W: Freeze,
impl<'a, W> !RefUnwindSafe for FileSink<'a, W>
impl<'a, W> Send for FileSink<'a, W>
impl<'a, W> !Sync for FileSink<'a, W>
impl<'a, W> Unpin for FileSink<'a, W>
impl<'a, W> !UnwindSafe for FileSink<'a, W>
Blanket Implementations§
source§impl<T> BorrowMut<T> for Twhere
T: ?Sized,
impl<T> BorrowMut<T> for Twhere
T: ?Sized,
source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
source§impl<T, Item> SinkExt<Item> for T
impl<T, Item> SinkExt<Item> for T
source§fn with<U, Fut, F, E>(self, f: F) -> With<Self, Item, U, Fut, F>
fn with<U, Fut, F, E>(self, f: F) -> With<Self, Item, U, Fut, F>
Composes a function in front of the sink. Read more
source§fn with_flat_map<U, St, F>(self, f: F) -> WithFlatMap<Self, Item, U, St, F>
fn with_flat_map<U, St, F>(self, f: F) -> WithFlatMap<Self, Item, U, St, F>
Composes a function in front of the sink. Read more
source§fn sink_map_err<E, F>(self, f: F) -> SinkMapErr<Self, F>
fn sink_map_err<E, F>(self, f: F) -> SinkMapErr<Self, F>
Transforms the error returned by the sink.
source§fn sink_err_into<E>(self) -> SinkErrInto<Self, Item, E>
fn sink_err_into<E>(self) -> SinkErrInto<Self, Item, E>
Map this sink’s error to a different error type using the
Into
trait. Read moresource§fn buffer(self, capacity: usize) -> Buffer<Self, Item>where
Self: Sized,
fn buffer(self, capacity: usize) -> Buffer<Self, Item>where
Self: Sized,
Adds a fixed-size buffer to the current sink. Read more
source§fn flush(&mut self) -> Flush<'_, Self, Item>where
Self: Unpin,
fn flush(&mut self) -> Flush<'_, Self, Item>where
Self: Unpin,
Flush the sink, processing all pending items. Read more
source§fn send(&mut self, item: Item) -> Send<'_, Self, Item>where
Self: Unpin,
fn send(&mut self, item: Item) -> Send<'_, Self, Item>where
Self: Unpin,
A future that completes after the given item has been fully processed
into the sink, including flushing. Read more
source§fn feed(&mut self, item: Item) -> Feed<'_, Self, Item>where
Self: Unpin,
fn feed(&mut self, item: Item) -> Feed<'_, Self, Item>where
Self: Unpin,
A future that completes after the given item has been received
by the sink. Read more
source§fn send_all<'a, St>(&'a mut self, stream: &'a mut St) -> SendAll<'a, Self, St>
fn send_all<'a, St>(&'a mut self, stream: &'a mut St) -> SendAll<'a, Self, St>
A future that completes after the given stream has been fully processed
into the sink, including flushing. Read more
source§fn right_sink<Si1>(self) -> Either<Si1, Self>
fn right_sink<Si1>(self) -> Either<Si1, Self>
source§fn poll_ready_unpin(
&mut self,
cx: &mut Context<'_>
) -> Poll<Result<(), Self::Error>>where
Self: Unpin,
fn poll_ready_unpin(
&mut self,
cx: &mut Context<'_>
) -> Poll<Result<(), Self::Error>>where
Self: Unpin,
A convenience method for calling
Sink::poll_ready
on Unpin
sink types.source§fn start_send_unpin(&mut self, item: Item) -> Result<(), Self::Error>where
Self: Unpin,
fn start_send_unpin(&mut self, item: Item) -> Result<(), Self::Error>where
Self: Unpin,
A convenience method for calling
Sink::start_send
on Unpin
sink types.