public class VectorizedPageIterator extends BasePageIterator
Nested classes inherited from BasePageIterator: BasePageIterator.IntIterator
Fields inherited from BasePageIterator: currentDL, currentRL, definitionLevels, desc, dictionary, hasNext, page, repetitionLevels, triplesCount, triplesRead, valueEncoding, values, writerVersion
| Constructor and Description |
|---|
VectorizedPageIterator(org.apache.parquet.column.ColumnDescriptor desc,
java.lang.String writerVersion,
boolean setValidityVector) |
| Modifier and Type | Method and Description |
|---|---|
protected void |
initDataReader(org.apache.parquet.column.Encoding dataEncoding,
org.apache.parquet.bytes.ByteBufferInputStream in,
int valueCount) |
protected void |
initDefinitionLevelsReader(org.apache.parquet.column.page.DataPageV1 dataPageV1,
org.apache.parquet.column.ColumnDescriptor desc,
org.apache.parquet.bytes.ByteBufferInputStream in,
int triplesCount) |
protected void |
initDefinitionLevelsReader(org.apache.parquet.column.page.DataPageV2 dataPageV2,
org.apache.parquet.column.ColumnDescriptor desc) |
int |
nextBatchBoolean(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
NullabilityHolder nullabilityHolder)
Method for reading batches of booleans.
|
int |
nextBatchDictionaryIds(org.apache.arrow.vector.IntVector vector,
int expectedBatchSize,
int numValsInVector,
NullabilityHolder holder)
Method for reading a batch of dictionary ids from the dictionary encoded data pages.
|
int |
nextBatchDoubles(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
Method for reading a batch of values of DOUBLE data type.
|
int |
nextBatchFixedLengthDecimal(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder nullabilityHolder)
Method for reading a batch of decimals backed by fixed length byte array parquet data type.
|
int |
nextBatchFixedWidthBinary(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder nullabilityHolder)
Method for reading batches of fixed width binary type (e.g. BYTE[7]).
|
int |
nextBatchFloats(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
Method for reading a batch of values of FLOAT data type.
|
int |
nextBatchIntegers(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
Method for reading a batch of values of INT32 data type.
|
int |
nextBatchIntLongBackedDecimal(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder nullabilityHolder)
Method for reading a batch of decimals backed by INT32 and INT64 parquet data types.
|
int |
nextBatchLongs(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
Method for reading a batch of values of INT64 data type.
|
int |
nextBatchTimestampMillis(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
Method for reading a batch of values of TIMESTAMP_MILLIS data type.
|
int |
nextBatchVarWidthType(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
NullabilityHolder nullabilityHolder)
Method for reading a batch of variable width data type (ENUM, JSON, UTF8, BSON).
|
protected void |
reset() |
void |
setAllPagesDictEncoded(boolean allDictEncoded) |
Methods inherited from BasePageIterator: currentPageCount, hasNext, initFromPage, initFromPage, setDictionary, setPage
public VectorizedPageIterator(org.apache.parquet.column.ColumnDescriptor desc,
java.lang.String writerVersion,
boolean setValidityVector)
public void setAllPagesDictEncoded(boolean allDictEncoded)
protected void reset()
Overrides: reset in class BasePageIterator
public int nextBatchDictionaryIds(org.apache.arrow.vector.IntVector vector,
int expectedBatchSize,
int numValsInVector,
NullabilityHolder holder)
public int nextBatchIntegers(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
public int nextBatchLongs(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
public int nextBatchTimestampMillis(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
public int nextBatchFloats(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
public int nextBatchDoubles(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
public int nextBatchIntLongBackedDecimal(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder nullabilityHolder)
public int nextBatchFixedLengthDecimal(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder nullabilityHolder)
Uses the DecimalVector.setBigEndian(int, byte[]) method so that the data in Arrow vector is indeed little
endian.
public int nextBatchVarWidthType(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
NullabilityHolder nullabilityHolder)
public int nextBatchFixedWidthBinary(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder nullabilityHolder)
The values are stored in a VarBinaryVector in Arrow.
public int nextBatchBoolean(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
NullabilityHolder nullabilityHolder)
protected void initDataReader(org.apache.parquet.column.Encoding dataEncoding,
org.apache.parquet.bytes.ByteBufferInputStream in,
int valueCount)
Overrides: initDataReader in class BasePageIterator
protected void initDefinitionLevelsReader(org.apache.parquet.column.page.DataPageV1 dataPageV1,
org.apache.parquet.column.ColumnDescriptor desc,
org.apache.parquet.bytes.ByteBufferInputStream in,
int triplesCount)
throws java.io.IOException
Overrides: initDefinitionLevelsReader in class BasePageIterator
Throws: java.io.IOException
protected void initDefinitionLevelsReader(org.apache.parquet.column.page.DataPageV2 dataPageV2,
org.apache.parquet.column.ColumnDescriptor desc)
initDefinitionLevelsReader in class BasePageIterator