Skip to content

Commit

Permalink
Merge branch 'remove-decimal-byte-array-converter' into remove-comple…
Browse files Browse the repository at this point in the history
…x-object-array-reader
  • Loading branch information
tustvold committed Aug 19, 2022
2 parents cd34e26 + 95ecb3c commit b810ec4
Show file tree
Hide file tree
Showing 15 changed files with 759 additions and 1,134 deletions.
93 changes: 10 additions & 83 deletions parquet/src/arrow/array_reader/builder.rs
Original file line number Diff line number Diff line change
Expand Up @@ -17,26 +17,20 @@

use std::sync::Arc;

use arrow::datatypes::{DataType, IntervalUnit, SchemaRef};
use arrow::datatypes::{DataType, SchemaRef};

use crate::arrow::array_reader::empty_array::make_empty_array_reader;
use crate::arrow::array_reader::fixed_len_byte_array::make_fixed_len_byte_array_reader;
use crate::arrow::array_reader::{
make_byte_array_dictionary_reader, make_byte_array_reader, ArrayReader,
ComplexObjectArrayReader, ListArrayReader, MapArrayReader, NullArrayReader,
PrimitiveArrayReader, RowGroupCollection, StructArrayReader,
};
use crate::arrow::buffer::converter::{
DecimalArrayConverter, DecimalByteArrayConvert, DecimalFixedLengthByteArrayConverter,
FixedLenBinaryConverter, FixedSizeArrayConverter, IntervalDayTimeArrayConverter,
IntervalDayTimeConverter, IntervalYearMonthArrayConverter,
IntervalYearMonthConverter,
ListArrayReader, MapArrayReader, NullArrayReader, PrimitiveArrayReader,
RowGroupCollection, StructArrayReader,
};
use crate::arrow::schema::{convert_schema, ParquetField, ParquetFieldType};
use crate::arrow::ProjectionMask;
use crate::basic::Type as PhysicalType;
use crate::data_type::{
BoolType, ByteArrayType, DoubleType, FixedLenByteArrayType, FloatType, Int32Type,
Int64Type, Int96Type,
BoolType, DoubleType, FloatType, Int32Type, Int64Type, Int96Type,
};
use crate::errors::Result;
use crate::schema::types::{ColumnDescriptor, ColumnPath, Type};
Expand Down Expand Up @@ -127,14 +121,12 @@ fn build_primitive_reader(
field: &ParquetField,
row_groups: &dyn RowGroupCollection,
) -> Result<Box<dyn ArrayReader>> {
let (col_idx, primitive_type, type_len) = match &field.field_type {
let (col_idx, primitive_type) = match &field.field_type {
ParquetFieldType::Primitive {
col_idx,
primitive_type,
} => match primitive_type.as_ref() {
Type::PrimitiveType { type_length, .. } => {
(*col_idx, primitive_type.clone(), *type_length)
}
Type::PrimitiveType { .. } => (*col_idx, primitive_type.clone()),
Type::GroupType { .. } => unreachable!(),
},
_ => unreachable!(),
Expand Down Expand Up @@ -202,76 +194,11 @@ fn build_primitive_reader(
Some(DataType::Dictionary(_, _)) => {
make_byte_array_dictionary_reader(page_iterator, column_desc, arrow_type)
}
Some(DataType::Decimal128(precision, scale)) => {
// read decimal data from parquet binary physical type
let convert = DecimalByteArrayConvert::new(DecimalArrayConverter::new(
precision as i32,
scale as i32,
));
Ok(Box::new(ComplexObjectArrayReader::<
ByteArrayType,
DecimalByteArrayConvert,
>::new(
page_iterator, column_desc, convert, arrow_type
)?))
}
_ => make_byte_array_reader(page_iterator, column_desc, arrow_type),
},
PhysicalType::FIXED_LEN_BYTE_ARRAY => match field.arrow_type {
DataType::Decimal128(precision, scale) => {
let converter = DecimalFixedLengthByteArrayConverter::new(
DecimalArrayConverter::new(precision as i32, scale as i32),
);
Ok(Box::new(ComplexObjectArrayReader::<
FixedLenByteArrayType,
DecimalFixedLengthByteArrayConverter,
>::new(
page_iterator,
column_desc,
converter,
arrow_type,
)?))
}
DataType::Interval(IntervalUnit::DayTime) => {
let converter =
IntervalDayTimeConverter::new(IntervalDayTimeArrayConverter {});
Ok(Box::new(ComplexObjectArrayReader::<
FixedLenByteArrayType,
_,
>::new(
page_iterator,
column_desc,
converter,
arrow_type,
)?))
}
DataType::Interval(IntervalUnit::YearMonth) => {
let converter =
IntervalYearMonthConverter::new(IntervalYearMonthArrayConverter {});
Ok(Box::new(ComplexObjectArrayReader::<
FixedLenByteArrayType,
_,
>::new(
page_iterator,
column_desc,
converter,
arrow_type,
)?))
}
_ => {
let converter =
FixedLenBinaryConverter::new(FixedSizeArrayConverter::new(type_len));
Ok(Box::new(ComplexObjectArrayReader::<
FixedLenByteArrayType,
FixedLenBinaryConverter,
>::new(
page_iterator,
column_desc,
converter,
arrow_type,
)?))
}
},
PhysicalType::FIXED_LEN_BYTE_ARRAY => {
make_fixed_len_byte_array_reader(page_iterator, column_desc, arrow_type)
}
}
}

Expand Down
Loading

0 comments on commit b810ec4

Please sign in to comment.