Package org.apache.parquet.column
Class ParquetProperties
- java.lang.Object
-
- org.apache.parquet.column.ParquetProperties
-
public class ParquetProperties extends Object
This class represents all the configurable Parquet properties.
-
-
Nested Class Summary
Nested Classes (Modifier and Type | Class | Description)
- static class | ParquetProperties.Builder
- static class | ParquetProperties.WriterVersion
-
Field Summary
Fields (Modifier and Type | Field | Description)
- static boolean | DEFAULT_BLOOM_FILTER_ENABLED
- static double | DEFAULT_BLOOM_FILTER_FPP
- static int | DEFAULT_COLUMN_INDEX_TRUNCATE_LENGTH
- static int | DEFAULT_DICTIONARY_PAGE_SIZE
- static boolean | DEFAULT_ESTIMATE_ROW_COUNT_FOR_PAGE_SIZE_CHECK
- static boolean | DEFAULT_IS_BYTE_STREAM_SPLIT_ENABLED
- static boolean | DEFAULT_IS_DICTIONARY_ENABLED
- static int | DEFAULT_MAX_BLOOM_FILTER_BYTES
- static int | DEFAULT_MAXIMUM_RECORD_COUNT_FOR_CHECK
- static int | DEFAULT_MINIMUM_RECORD_COUNT_FOR_CHECK
- static int | DEFAULT_PAGE_ROW_COUNT_LIMIT
- static int | DEFAULT_PAGE_SIZE
- static boolean | DEFAULT_PAGE_WRITE_CHECKSUM_ENABLED
- static int | DEFAULT_STATISTICS_TRUNCATE_LENGTH
- static ValuesWriterFactory | DEFAULT_VALUES_WRITER_FACTORY
- static ParquetProperties.WriterVersion | DEFAULT_WRITER_VERSION
-
Method Summary
-
-
-
Field Detail
-
DEFAULT_PAGE_SIZE
public static final int DEFAULT_PAGE_SIZE
- See Also:
- Constant Field Values
-
DEFAULT_DICTIONARY_PAGE_SIZE
public static final int DEFAULT_DICTIONARY_PAGE_SIZE
- See Also:
- Constant Field Values
-
DEFAULT_IS_DICTIONARY_ENABLED
public static final boolean DEFAULT_IS_DICTIONARY_ENABLED
- See Also:
- Constant Field Values
-
DEFAULT_IS_BYTE_STREAM_SPLIT_ENABLED
public static final boolean DEFAULT_IS_BYTE_STREAM_SPLIT_ENABLED
- See Also:
- Constant Field Values
-
DEFAULT_WRITER_VERSION
public static final ParquetProperties.WriterVersion DEFAULT_WRITER_VERSION
-
DEFAULT_ESTIMATE_ROW_COUNT_FOR_PAGE_SIZE_CHECK
public static final boolean DEFAULT_ESTIMATE_ROW_COUNT_FOR_PAGE_SIZE_CHECK
- See Also:
- Constant Field Values
-
DEFAULT_MINIMUM_RECORD_COUNT_FOR_CHECK
public static final int DEFAULT_MINIMUM_RECORD_COUNT_FOR_CHECK
- See Also:
- Constant Field Values
-
DEFAULT_MAXIMUM_RECORD_COUNT_FOR_CHECK
public static final int DEFAULT_MAXIMUM_RECORD_COUNT_FOR_CHECK
- See Also:
- Constant Field Values
-
DEFAULT_COLUMN_INDEX_TRUNCATE_LENGTH
public static final int DEFAULT_COLUMN_INDEX_TRUNCATE_LENGTH
- See Also:
- Constant Field Values
-
DEFAULT_STATISTICS_TRUNCATE_LENGTH
public static final int DEFAULT_STATISTICS_TRUNCATE_LENGTH
- See Also:
- Constant Field Values
-
DEFAULT_PAGE_ROW_COUNT_LIMIT
public static final int DEFAULT_PAGE_ROW_COUNT_LIMIT
- See Also:
- Constant Field Values
-
DEFAULT_MAX_BLOOM_FILTER_BYTES
public static final int DEFAULT_MAX_BLOOM_FILTER_BYTES
- See Also:
- Constant Field Values
-
DEFAULT_BLOOM_FILTER_ENABLED
public static final boolean DEFAULT_BLOOM_FILTER_ENABLED
- See Also:
- Constant Field Values
-
DEFAULT_BLOOM_FILTER_FPP
public static final double DEFAULT_BLOOM_FILTER_FPP
- See Also:
- Constant Field Values
-
DEFAULT_PAGE_WRITE_CHECKSUM_ENABLED
public static final boolean DEFAULT_PAGE_WRITE_CHECKSUM_ENABLED
- See Also:
- Constant Field Values
-
DEFAULT_VALUES_WRITER_FACTORY
public static final ValuesWriterFactory DEFAULT_VALUES_WRITER_FACTORY
-
-
Method Detail
-
newRepetitionLevelWriter
public ValuesWriter newRepetitionLevelWriter(ColumnDescriptor path)
-
newDefinitionLevelWriter
public ValuesWriter newDefinitionLevelWriter(ColumnDescriptor path)
-
newRepetitionLevelEncoder
public RunLengthBitPackingHybridEncoder newRepetitionLevelEncoder(ColumnDescriptor path)
-
newDefinitionLevelEncoder
public RunLengthBitPackingHybridEncoder newDefinitionLevelEncoder(ColumnDescriptor path)
-
newValuesWriter
public ValuesWriter newValuesWriter(ColumnDescriptor path)
-
getPageSizeThreshold
public int getPageSizeThreshold()
-
getInitialSlabSize
public int getInitialSlabSize()
-
getDictionaryPageSizeThreshold
public int getDictionaryPageSizeThreshold()
-
getWriterVersion
public ParquetProperties.WriterVersion getWriterVersion()
-
isEnableDictionary
@Deprecated public boolean isEnableDictionary()
Deprecated.
-
isDictionaryEnabled
public boolean isDictionaryEnabled(ColumnDescriptor column)
-
isByteStreamSplitEnabled
public boolean isByteStreamSplitEnabled()
-
getAllocator
public org.apache.parquet.bytes.ByteBufferAllocator getAllocator()
-
newColumnWriteStore
public ColumnWriteStore newColumnWriteStore(MessageType schema, PageWriteStore pageStore)
-
newColumnWriteStore
public ColumnWriteStore newColumnWriteStore(MessageType schema, PageWriteStore pageStore, BloomFilterWriteStore bloomFilterWriteStore)
-
getMinRowCountForPageSizeCheck
public int getMinRowCountForPageSizeCheck()
-
getMaxRowCountForPageSizeCheck
public int getMaxRowCountForPageSizeCheck()
-
getValuesWriterFactory
public ValuesWriterFactory getValuesWriterFactory()
-
getColumnIndexTruncateLength
public int getColumnIndexTruncateLength()
-
getStatisticsTruncateLength
public int getStatisticsTruncateLength()
-
estimateNextSizeCheck
public boolean estimateNextSizeCheck()
-
getPageRowCountLimit
public int getPageRowCountLimit()
-
getPageWriteChecksumEnabled
public boolean getPageWriteChecksumEnabled()
-
getBloomFilterNDV
public OptionalLong getBloomFilterNDV(ColumnDescriptor column)
-
getBloomFilterFPP
public OptionalDouble getBloomFilterFPP(ColumnDescriptor column)
-
isBloomFilterEnabled
public boolean isBloomFilterEnabled(ColumnDescriptor column)
-
getMaxBloomFilterBytes
public int getMaxBloomFilterBytes()
-
builder
public static ParquetProperties.Builder builder()
-
copy
public static ParquetProperties.Builder copy(ParquetProperties toCopy)
-
-