public class VectorizedPageIterator extends BasePageIterator
BasePageIterator.IntIterator
currentDL, currentRL, definitionLevels, desc, dictionary, hasNext, page, repetitionLevels, triplesCount, triplesRead, valueEncoding, values, writerVersion
Constructor and Description |
---|
VectorizedPageIterator(org.apache.parquet.column.ColumnDescriptor desc,
java.lang.String writerVersion,
boolean setValidityVector) |
Modifier and Type | Method and Description |
---|---|
protected void |
initDataReader(org.apache.parquet.column.Encoding dataEncoding,
org.apache.parquet.bytes.ByteBufferInputStream in,
int valueCount) |
protected void |
initDefinitionLevelsReader(org.apache.parquet.column.page.DataPageV1 dataPageV1,
org.apache.parquet.column.ColumnDescriptor desc,
org.apache.parquet.bytes.ByteBufferInputStream in,
int triplesCount) |
protected void |
initDefinitionLevelsReader(org.apache.parquet.column.page.DataPageV2 dataPageV2,
org.apache.parquet.column.ColumnDescriptor desc) |
int |
nextBatchBoolean(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
NullabilityHolder nullabilityHolder)
Method for reading batches of booleans.
|
int |
nextBatchDictionaryIds(org.apache.arrow.vector.IntVector vector,
int expectedBatchSize,
int numValsInVector,
NullabilityHolder holder)
Method for reading a batch of dictionary ids from the dictionary encoded data pages.
|
int |
nextBatchDoubles(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
Method for reading a batch of values of DOUBLE data type.
|
int |
nextBatchFixedLengthDecimal(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder nullabilityHolder)
Method for reading a batch of decimals backed by fixed length byte array parquet data type.
|
int |
nextBatchFixedWidthBinary(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder nullabilityHolder)
Method for reading batches of fixed width binary type; the data is stored in a VarBinaryVector in Arrow.
|
int |
nextBatchFloats(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
Method for reading a batch of values of FLOAT data type.
|
int |
nextBatchIntBackedDecimal(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
NullabilityHolder nullabilityHolder)
Method for reading a batch of decimals backed by INT32 and INT64 parquet data types.
|
int |
nextBatchIntegers(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
Method for reading a batch of values of INT32 data type.
|
int |
nextBatchLongBackedDecimal(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
NullabilityHolder nullabilityHolder) |
int |
nextBatchLongs(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
Method for reading a batch of values of INT64 data type.
|
int |
nextBatchTimestampMillis(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
int typeWidth,
NullabilityHolder holder)
Method for reading a batch of values of TIMESTAMP_MILLIS data type.
|
int |
nextBatchVarWidthType(org.apache.arrow.vector.FieldVector vector,
int expectedBatchSize,
int numValsInVector,
NullabilityHolder nullabilityHolder)
Method for reading a batch of variable width data type (ENUM, JSON, UTF8, BSON).
|
boolean |
producesDictionaryEncodedVector() |
protected void |
reset() |
void |
setAllPagesDictEncoded(boolean allDictEncoded) |
currentPageCount, hasNext, initFromPage, initFromPage, setDictionary, setPage
public VectorizedPageIterator(org.apache.parquet.column.ColumnDescriptor desc, java.lang.String writerVersion, boolean setValidityVector)
public void setAllPagesDictEncoded(boolean allDictEncoded)
protected void reset()
reset
in class BasePageIterator
public int nextBatchDictionaryIds(org.apache.arrow.vector.IntVector vector, int expectedBatchSize, int numValsInVector, NullabilityHolder holder)
public int nextBatchIntegers(org.apache.arrow.vector.FieldVector vector, int expectedBatchSize, int numValsInVector, int typeWidth, NullabilityHolder holder)
public int nextBatchLongs(org.apache.arrow.vector.FieldVector vector, int expectedBatchSize, int numValsInVector, int typeWidth, NullabilityHolder holder)
public int nextBatchTimestampMillis(org.apache.arrow.vector.FieldVector vector, int expectedBatchSize, int numValsInVector, int typeWidth, NullabilityHolder holder)
public int nextBatchFloats(org.apache.arrow.vector.FieldVector vector, int expectedBatchSize, int numValsInVector, int typeWidth, NullabilityHolder holder)
public int nextBatchDoubles(org.apache.arrow.vector.FieldVector vector, int expectedBatchSize, int numValsInVector, int typeWidth, NullabilityHolder holder)
public int nextBatchIntBackedDecimal(org.apache.arrow.vector.FieldVector vector, int expectedBatchSize, int numValsInVector, NullabilityHolder nullabilityHolder)
public int nextBatchLongBackedDecimal(org.apache.arrow.vector.FieldVector vector, int expectedBatchSize, int numValsInVector, NullabilityHolder nullabilityHolder)
public int nextBatchFixedLengthDecimal(org.apache.arrow.vector.FieldVector vector, int expectedBatchSize, int numValsInVector, int typeWidth, NullabilityHolder nullabilityHolder)
DecimalVector.setBigEndian(int, byte[])
method so that the data in Arrow vector is indeed little
endian.
public int nextBatchVarWidthType(org.apache.arrow.vector.FieldVector vector, int expectedBatchSize, int numValsInVector, NullabilityHolder nullabilityHolder)
public int nextBatchFixedWidthBinary(org.apache.arrow.vector.FieldVector vector, int expectedBatchSize, int numValsInVector, int typeWidth, NullabilityHolder nullabilityHolder)
VarBinaryVector
in Arrow.
public boolean producesDictionaryEncodedVector()
public int nextBatchBoolean(org.apache.arrow.vector.FieldVector vector, int expectedBatchSize, int numValsInVector, NullabilityHolder nullabilityHolder)
protected void initDataReader(org.apache.parquet.column.Encoding dataEncoding, org.apache.parquet.bytes.ByteBufferInputStream in, int valueCount)
initDataReader
in class BasePageIterator
protected void initDefinitionLevelsReader(org.apache.parquet.column.page.DataPageV1 dataPageV1, org.apache.parquet.column.ColumnDescriptor desc, org.apache.parquet.bytes.ByteBufferInputStream in, int triplesCount) throws java.io.IOException
initDefinitionLevelsReader
in class BasePageIterator
java.io.IOException
protected void initDefinitionLevelsReader(org.apache.parquet.column.page.DataPageV2 dataPageV2, org.apache.parquet.column.ColumnDescriptor desc)
initDefinitionLevelsReader
in class BasePageIterator