use std::convert::TryFrom;
use std::sync::Arc;
use arrow_format::flight::data::{FlightData, SchemaResult};
use arrow_format::ipc;
use crate::{
array::*,
datatypes::*,
error::{ArrowError, Result},
io::ipc::fb_to_schema,
io::ipc::read::read_record_batch,
io::ipc::write,
io::ipc::write::common::{encoded_batch, DictionaryTracker, EncodedData, IpcWriteOptions},
record_batch::RecordBatch,
};
pub fn serialize_batch(
batch: &RecordBatch,
options: &IpcWriteOptions,
) -> (Vec<FlightData>, FlightData) {
let mut dictionary_tracker = DictionaryTracker::new(false);
let (encoded_dictionaries, encoded_batch) =
encoded_batch(batch, &mut dictionary_tracker, options)
.expect("DictionaryTracker configured above to not error on replacement");
let flight_dictionaries = encoded_dictionaries.into_iter().map(Into::into).collect();
let flight_batch = encoded_batch.into();
(flight_dictionaries, flight_batch)
}
impl From<EncodedData> for FlightData {
fn from(data: EncodedData) -> Self {
FlightData {
data_header: data.ipc_message,
data_body: data.arrow_data,
..Default::default()
}
}
}
pub fn serialize_schema_to_result(schema: &Schema, options: &IpcWriteOptions) -> SchemaResult {
SchemaResult {
schema: schema_as_flatbuffer(schema, options),
}
}
pub fn serialize_schema(schema: &Schema, options: &IpcWriteOptions) -> FlightData {
let data_header = schema_as_flatbuffer(schema, options);
FlightData {
data_header,
..Default::default()
}
}
pub fn serialize_schema_to_info(schema: &Schema, options: &IpcWriteOptions) -> Result<Vec<u8>> {
let encoded_data = schema_as_encoded_data(schema, options);
let mut schema = vec![];
write::common::write_message(&mut schema, encoded_data, options)?;
Ok(schema)
}
fn schema_as_flatbuffer(schema: &Schema, options: &IpcWriteOptions) -> Vec<u8> {
let encoded_data = schema_as_encoded_data(schema, options);
encoded_data.ipc_message
}
fn schema_as_encoded_data(arrow_schema: &Schema, options: &IpcWriteOptions) -> EncodedData {
EncodedData {
ipc_message: write::schema_to_bytes(arrow_schema, *options.metadata_version()),
arrow_data: vec![],
}
}
fn schema_from_bytes(bytes: &[u8]) -> Result<Schema> {
if let Ok(ipc) = ipc::Message::root_as_message(bytes) {
if let Some((schema, _)) = ipc.header_as_schema().map(fb_to_schema) {
Ok(schema)
} else {
Err(ArrowError::Ipc("Unable to get head as schema".to_string()))
}
} else {
Err(ArrowError::Ipc("Unable to get root as message".to_string()))
}
}
impl TryFrom<&FlightData> for Schema {
type Error = ArrowError;
fn try_from(data: &FlightData) -> Result<Self> {
schema_from_bytes(&data.data_header[..]).map_err(|err| {
ArrowError::Ipc(format!(
"Unable to convert flight data to Arrow schema: {}",
err
))
})
}
}
impl TryFrom<&SchemaResult> for Schema {
type Error = ArrowError;
fn try_from(data: &SchemaResult) -> Result<Self> {
schema_from_bytes(&data.schema[..]).map_err(|err| {
ArrowError::Ipc(format!(
"Unable to convert schema result to Arrow schema: {}",
err
))
})
}
}
pub fn deserialize_batch(
data: &FlightData,
schema: Arc<Schema>,
is_little_endian: bool,
dictionaries_by_field: &[Option<Arc<dyn Array>>],
) -> Result<RecordBatch> {
let message = ipc::Message::root_as_message(&data.data_header[..])
.map_err(|err| ArrowError::Ipc(format!("Unable to get root as message: {:?}", err)))?;
let mut reader = std::io::Cursor::new(&data.data_body);
message
.header_as_record_batch()
.ok_or_else(|| {
ArrowError::Ipc("Unable to convert flight data header to a record batch".to_string())
})
.map(|batch| {
read_record_batch(
batch,
schema.clone(),
None,
is_little_endian,
dictionaries_by_field,
ipc::Schema::MetadataVersion::V5,
&mut reader,
0,
)
})?
}