public class MergeOnReadInputFormat extends org.apache.flink.api.common.io.RichInputFormat<org.apache.flink.table.data.RowData,MergeOnReadInputSplit>
Uses ParquetRecordReader to read files instead of FSDataInputStream,
and overrides createInputSplits(int) and close() to change their behavior.
| Modifier and Type | Class and Description |
|---|---|
static class |
MergeOnReadInputFormat.Builder
Builder for
MergeOnReadInputFormat. |
protected static class |
MergeOnReadInputFormat.LogFileOnlyIterator |
protected static class |
MergeOnReadInputFormat.MergeIterator |
| Modifier and Type | Field and Description |
|---|---|
protected org.apache.flink.configuration.Configuration |
conf |
protected org.apache.hadoop.conf.Configuration |
hadoopConf |
protected MergeOnReadTableState |
tableState |
| Modifier | Constructor and Description |
|---|---|
protected |
MergeOnReadInputFormat(org.apache.flink.configuration.Configuration conf,
MergeOnReadTableState tableState,
List<org.apache.flink.table.types.DataType> fieldTypes,
String defaultPartName,
List<ExpressionPredicates.Predicate> predicates,
long limit,
boolean emitDelete,
InternalSchemaManager internalSchemaManager) |
| Modifier and Type | Method and Description |
|---|---|
static MergeOnReadInputFormat.Builder |
builder()
Returns the builder for
MergeOnReadInputFormat. |
void |
close() |
void |
configure(org.apache.flink.configuration.Configuration configuration) |
MergeOnReadInputSplit[] |
createInputSplits(int minNumSplits) |
protected ClosableIterator<org.apache.flink.table.data.RowData> |
getBaseFileIterator(String path) |
protected ClosableIterator<org.apache.flink.table.data.RowData> |
getBaseFileIteratorWithMetadata(String path) |
protected ClosableIterator<org.apache.flink.table.data.RowData> |
getFullLogFileIterator(MergeOnReadInputSplit split) |
org.apache.flink.core.io.InputSplitAssigner |
getInputSplitAssigner(MergeOnReadInputSplit[] mergeOnReadInputSplits) |
org.apache.flink.api.common.io.statistics.BaseStatistics |
getStatistics(org.apache.flink.api.common.io.statistics.BaseStatistics baseStatistics) |
protected ClosableIterator<org.apache.flink.table.data.RowData> |
initIterator(MergeOnReadInputSplit split) |
boolean |
isClosed() |
void |
isEmitDelete(boolean emitDelete) |
org.apache.flink.table.data.RowData |
nextRecord(org.apache.flink.table.data.RowData o) |
void |
open(MergeOnReadInputSplit split) |
boolean |
reachedEnd() |
protected final org.apache.flink.configuration.Configuration conf
protected transient org.apache.hadoop.conf.Configuration hadoopConf
protected final MergeOnReadTableState tableState
protected MergeOnReadInputFormat(org.apache.flink.configuration.Configuration conf,
MergeOnReadTableState tableState,
List<org.apache.flink.table.types.DataType> fieldTypes,
String defaultPartName,
List<ExpressionPredicates.Predicate> predicates,
long limit,
boolean emitDelete,
InternalSchemaManager internalSchemaManager)
public static MergeOnReadInputFormat.Builder builder()
Returns the builder for MergeOnReadInputFormat.
public void open(MergeOnReadInputSplit split) throws IOException
Throws: IOException
protected ClosableIterator<org.apache.flink.table.data.RowData> initIterator(MergeOnReadInputSplit split) throws IOException
Throws: IOException
public void configure(org.apache.flink.configuration.Configuration configuration)
public org.apache.flink.api.common.io.statistics.BaseStatistics getStatistics(org.apache.flink.api.common.io.statistics.BaseStatistics baseStatistics)
public MergeOnReadInputSplit[] createInputSplits(int minNumSplits)
public org.apache.flink.core.io.InputSplitAssigner getInputSplitAssigner(MergeOnReadInputSplit[] mergeOnReadInputSplits)
public boolean reachedEnd()
throws IOException
Throws: IOException
public org.apache.flink.table.data.RowData nextRecord(org.apache.flink.table.data.RowData o)
public void close()
throws IOException
Throws: IOException
public boolean isClosed()
protected ClosableIterator<org.apache.flink.table.data.RowData> getBaseFileIteratorWithMetadata(String path)
protected ClosableIterator<org.apache.flink.table.data.RowData> getBaseFileIterator(String path) throws IOException
Throws: IOException
protected ClosableIterator<org.apache.flink.table.data.RowData> getFullLogFileIterator(MergeOnReadInputSplit split)
@VisibleForTesting public void isEmitDelete(boolean emitDelete)
Copyright © 2023 The Apache Software Foundation. All rights reserved.