public abstract class VectorMapJoinCommonOperator extends MapJoinOperator implements VectorizationContextRegion
Nested classes/interfaces inherited from class Operator: Operator.OperatorFunc, Operator.State
firstSmallTable, hashMapRowGetters, loader, mapJoinTables, spilledMapJoinTables
emptyList, joinKeys, joinKeysObjectInspectors, posBigTable
alias, aliasFilterTags, condn, countAfterReport, dummyObj, dummyObjVectors, filterMaps, filterTags, forwardCache, heartbeatInterval, intermediate, joinFilterObjectInspectors, joinFilters, joinValues, joinValuesObjectInspectors, joinValuesStandardObjectInspectors, needsPostEvaluation, noOuterJoin, NOTSKIPBIGTABLE, nullsafes, numAliases, offsets, order, residualJoinFilters, residualJoinFiltersOIs, rowContainerPostFilteredOuterJoin, rowContainerStandardObjectInspectors, skipVectors, spillTableDesc, totalSz
abortOp, asyncInitOperations, cContext, childOperators, childOperatorsArray, childOperatorsTag, colExprMap, conf, CONTEXT_NAME_KEY, done, groupKeyObject, HIVECOUNTERCREATEDFILES, HIVECOUNTERFATAL, id, indexForTezUnion, inputObjInspectors, isLogDebugEnabled, isLogInfoEnabled, isLogTraceEnabled, operatorId, out, outputObjInspector, parentOperators, PLOG, reporter, runTimeNumRows, state, statsMap
| Modifier | Constructor and Description |
|---|---|
| `protected` | `VectorMapJoinCommonOperator()`<br>Kryo constructor. |
| | `VectorMapJoinCommonOperator(CompilationOpContext ctx)` |
| | `VectorMapJoinCommonOperator(CompilationOpContext ctx, VectorizationContext vContext, OperatorDesc conf)` |
| Modifier and Type | Method and Description |
|---|---|
| `protected void` | `commonSetup(org.apache.hadoop.hive.ql.exec.vector.VectorizedRowBatch batch)` |
| `protected void` | `completeInitializationOp(Object[] os)`<br>This method can be used to retrieve the results from async operations started at init time - before the operator pipeline is started. |
| `protected void` | `determineCommonInfo(boolean isOuter)` |
| `protected void` | `displayBatchColumns(org.apache.hadoop.hive.ql.exec.vector.VectorizedRowBatch batch, String batchName)` |
| `protected HashTableLoader` | `getHashTableLoader(org.apache.hadoop.conf.Configuration hconf)`<br>This override lets us substitute our own fast vectorized hash table loader. |
| `protected abstract String` | `getLoggingPrefix()` |
| `protected String` | `getLoggingPrefix(String className)` |
| `VectorizationContext` | `getOuputVectorizationContext()` |
| `OperatorType` | `getType()`<br>Return the type of the specific operator among the types in OperatorType. |
| `protected void` | `initializeOp(org.apache.hadoop.conf.Configuration hconf)`<br>Operator-specific initialization. |
| `protected void` | `initLoggingPrefix(String className)` |
| `protected org.apache.hadoop.hive.ql.exec.vector.VectorizedRowBatch` | `setupOverflowBatch()` |
| `protected void` | `setupVOutContext(List<String> outputColumnNames)`<br>Set up the vectorized row batch description of the output of the native vectorized map join operator. |
canSkipJoinProcessing, canSkipReload, cleanUpInputFileChangedOp, closeOp, endGroup, generateMapMetaData, getName, getOperatorName, getRefKey, getValueObjectInspectors, isInputFileChangeSensitive, loadHashTable, process, reloadHashTable, reProcessBigTable, setMapJoinKey, spillBigTableRow, startGroup
checkAndGenObject, getFilteredValue, getFilterTag, getNextSize, getPosToAliasMap, hasFilter, internalForward, opAllowedAfterMapJoin, opAllowedBeforeMapJoin, reportProgress, setPosToAliasMap
abort, acceptLimitPushdown, allInitializedParentsAreClosed, areAllParentsInitialized, augmentPlan, cleanUpInputFileChanged, clone, cloneOp, cloneRecursiveChildren, close, columnNamesRowResolvedCanBeObtained, createDummy, defaultEndGroup, defaultStartGroup, dump, dump, flush, forward, getAdditionalCounters, getChildOperators, getChildren, getColumnExprMap, getCompilationOpContext, getConf, getConfiguration, getDone, getExecContext, getGroupKeyObject, getIdentifier, getIndexForTezUnion, getInputObjInspectors, getIsReduceSink, getNextCntr, getNumChild, getNumParent, getOperatorId, getOpTraits, getOutputObjInspector, getParentOperators, getReduceOutputName, getSchema, getStatistics, getStats, initEvaluators, initEvaluators, initEvaluatorsAndReturnStruct, initialize, initialize, initializeChildren, initializeLocalWork, initOperatorId, isUseBucketizedHiveInputFormat, jobClose, jobCloseOp, logStats, opAllowedBeforeSortMergeJoin, opAllowedConvertMapJoin, passExecContext, preorderMap, processGroup, removeChild, removeChildAndAdoptItsChildren, removeParent, removeParents, replaceChild, replaceParent, reset, resetStats, setAlias, setChildOperators, setColumnExprMap, setCompilationOpContext, setConf, setDone, setExecContext, setGroupKeyObject, setId, setIndexForTezUnion, setInputContext, setInputObjInspectors, setOperatorId, setOpTraits, setOutputCollector, setParentOperators, setReporter, setSchema, setStatistics, setUseBucketizedHiveInputFormat, supportAutomaticSortMergeJoin, supportSkewJoinOptimization, supportUnionRemoveOptimization, toString, toString
protected transient String loggingPrefix
protected VectorMapJoinDesc vectorDesc
protected VectorMapJoinInfo vectorMapJoinInfo
protected boolean isOuterJoin
protected byte posSingleVectorMapJoinSmallTable
protected VectorizationContext vContext
protected VectorizationContext vOutContext
protected int[] outputProjection
protected TypeInfo[] outputTypeInfos
protected VectorExpression[] bigTableFilterExpressions
protected VectorExpression[] bigTableKeyExpressions
protected VectorExpression[] bigTableValueExpressions
protected int[] bigTableKeyColumnMap
protected String[] bigTableKeyColumnNames
protected TypeInfo[] bigTableKeyTypeInfos
protected int[] bigTableValueColumnMap
protected String[] bigTableValueColumnNames
protected TypeInfo[] bigTableValueTypeInfos
protected VectorColumnOutputMapping bigTableRetainedMapping
protected VectorColumnOutputMapping bigTableOuterKeyMapping
protected VectorColumnSourceMapping smallTableMapping
protected VectorColumnSourceMapping projectionMapping
protected int[] smallTableOutputVectorColumns
protected int[] bigTableOuterKeyOutputVectorColumns
protected int[] bigTableByteColumnVectorColumns
protected int[] smallTableByteColumnVectorColumns
protected transient boolean useOverflowRepeatedThreshold
protected transient int overflowRepeatedThreshold
protected transient VectorCopyRow bigTableRetainedVectorCopy
protected transient VectorCopyRow bigTableVectorCopyOuterKeys
protected transient VectorDeserializeRow<LazyBinaryDeserializeRead> smallTableVectorDeserializeRow
protected transient org.apache.hadoop.hive.ql.exec.vector.VectorizedRowBatch overflowBatch
protected transient org.apache.hadoop.hive.ql.exec.vector.VectorizedRowBatch spillReplayBatch
protected transient boolean needCommonSetup
protected transient boolean needHashTableSetup
protected transient VectorMapJoinHashTable vectorMapJoinHashTable
protected VectorMapJoinCommonOperator()
public VectorMapJoinCommonOperator(CompilationOpContext ctx)
public VectorMapJoinCommonOperator(CompilationOpContext ctx, VectorizationContext vContext, OperatorDesc conf) throws HiveException
Throws: HiveException
protected abstract String getLoggingPrefix()
protected void initLoggingPrefix(String className)
protected void determineCommonInfo(boolean isOuter) throws HiveException
Throws: HiveException
protected void setupVOutContext(List<String> outputColumnNames)
protected HashTableLoader getHashTableLoader(org.apache.hadoop.conf.Configuration hconf)
Overrides: getHashTableLoader in class MapJoinOperator
protected void initializeOp(org.apache.hadoop.conf.Configuration hconf) throws HiveException
Description copied from class: Operator
Operator-specific initialization.
Overrides: initializeOp in class MapJoinOperator
Throws: HiveException
protected void completeInitializationOp(Object[] os) throws HiveException
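Description copied from class: Operator
This method can be used to retrieve the results from async operations started at init time - before the operator pipeline is started.
Overrides: completeInitializationOp in class MapJoinOperator
Throws: HiveException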
protected org.apache.hadoop.hive.ql.exec.vector.VectorizedRowBatch setupOverflowBatch() throws HiveException
Throws: HiveException
protected void commonSetup(org.apache.hadoop.hive.ql.exec.vector.VectorizedRowBatch batch) throws HiveException
Throws: HiveException
protected void displayBatchColumns(org.apache.hadoop.hive.ql.exec.vector.VectorizedRowBatch batch, String batchName)
public OperatorType getType()
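Description copied from class: Operator
Return the type of the specific operator among the types in OperatorType.
Overrides: getType in class MapJoinOperator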
public VectorizationContext getOuputVectorizationContext()
Specified by: getOuputVectorizationContext in interface VectorizationContextRegion
Copyright © 2021 The Apache Software Foundation. All rights reserved.