Write Arrow
When compiled with feature io_ipc
, this crate can be used to write Arrow files.
An Arrow file is composed by a header, a footer, and blocks of RecordBatch
es.
The example below shows how to write RecordBatch
es:
use std::fs::File; use arrow2::array::{Array, Int32Array, Utf8Array}; use arrow2::chunk::Chunk; use arrow2::datatypes::{DataType, Field, Schema}; use arrow2::error::Result; use arrow2::io::ipc::write; fn write_batches(path: &str, schema: Schema, chunks: &[Chunk<Box<dyn Array>>]) -> Result<()> { let file = File::create(path)?; let options = write::WriteOptions { compression: None }; let mut writer = write::FileWriter::new(file, schema, None, options); writer.start()?; for chunk in chunks { writer.write(chunk, None)? } writer.finish() } fn main() -> Result<()> { use std::env; let args: Vec<String> = env::args().collect(); let file_path = &args[1]; // create a batch let schema = Schema::from(vec![ Field::new("a", DataType::Int32, false), Field::new("b", DataType::Utf8, false), ]); let a = Int32Array::from_slice(&[1, 2, 3, 4, 5]); let b = Utf8Array::<i32>::from_slice(&["a", "b", "c", "d", "e"]); let chunk = Chunk::try_new(vec![a.boxed(), b.boxed()])?; // write it write_batches(file_path, schema, &[chunk])?; Ok(()) }