public class MergeFileWork extends MapWork
MapWork.LlapIODescriptor, MapWork.MapExplainVectorization
BaseWork.BaseExplainVectorization
SAMPLING_ON_PREV_MR, SAMPLING_ON_START
inputFormatSupportSet, llapMode, supportRemovedReasons, supportSetInUse, uberMode, useVectorizedInputFileFormat, vectorizationEnabled, vectorizationExamined, vectorizedRowBatchCtx, vectorizedTestingReducerBatchSize, vectorizedVertexNum
colExprMap, memAvailable, memNeeded, opProps, opTraits, runtimeStatsTmpDir, statistics, vectorDesc, vectorMode
| Constructor and Description |
|---|
| MergeFileWork(List<org.apache.hadoop.fs.Path> inputPaths, org.apache.hadoop.fs.Path outputDir, boolean hasDynamicPartitions, String srcTblInputFormat, TableDesc tbl) |
| MergeFileWork(List<org.apache.hadoop.fs.Path> inputPaths, org.apache.hadoop.fs.Path outputDir, String srcTblInputFormat, TableDesc tbl) |
addMapWork, addPathToAlias, addPathToAlias, addPathToPartitionInfo, configureJobConf, deriveExplainAttributes, deriveLlap, getAliases, getAliasToPartnInfo, getAliasToWork, getAllRootOperators, getAnyRootOperator, getBaseSrc, getBucketedColsByDirectory, getCacheAffinity, getDoSplitsGrouping, getDummyTableScan, getEventSourceColumnNameMap, getEventSourceColumnTypeMap, getEventSourcePartKeyExprMap, getEventSourceTableDescMap, getExecutionMode, getIncludedBuckets, getInputFormatSupportSet, getLlapIoDescString, getMapAliases, getMapExplainVectorization, getMaxSplitSize, getMinSplitSizePerNode, getMinSplitSizePerRack, getNameToSplitSample, getNotEnabledInputFileFormatReason, getNumMapTasks, getPartitionDescs, getPaths, getPathToAliases, getPathToPartitionInfo, getSamplingType, getSamplingTypeString, getSortedColsByDirectory, getSupportRemovedReasons, getSupportSetInUse, getTmpHDFSPath, getTmpPathForPartitionPruning, getTruncatedPathToAliases, getUseVectorizedInputFileFormat, getVectorizationEnabledConditionsMet, getVectorizationEnabledConditionsNotMet, getVectorizationInputFileFormatClassNameSet, getVectorizedRowBatch, getVectorPartitionDescList, getWorks, initialize, internTable, isInputFormatSorted, isLeftInputJoin, isMapperCannotSpanPartns, isMergeFromResolver, isUseBucketizedHiveInputFormat, mergeAliasedInput, mergingInto, removePathToAlias, removePathToPartitionInfo, replaceRoots, setAliasToPartnInfo, setAliasToWork, setBaseSrc, setDoSplitsGrouping, setDummyTableScan, setEventSourceColumnNameMap, setEventSourcePartKeyExprMap, setEventSourceTableDescMap, setIncludedBuckets, setInputformat, setInputFormatSorted, setInputFormatSupportSet, setIsMergeFromResolver, setLeftInputJoin, setMapAliases, setMapperCannotSpanPartns, setMaxSplitSize, setMinSplitSize, setMinSplitSizePerNode, setMinSplitSizePerRack, setNameToSplitSample, setNotEnabledInputFileFormatReason, setNumMapTasks, setPathToAliases, setPathToPartitionInfo, setSamplingType, setSupportRemovedReasons, 
setSupportSetInUse, setTmpHDFSPath, setTmpPathForPartitionPruning, setUseBucketizedHiveInputFormat, setUseVectorizedInputFileFormat, setVectorizationEnabledConditionsMet, setVectorizationEnabledConditionsNotMet, setVectorizationInputFileFormatClassNameSet, setVectorizedRowBatch, setVectorPartitionDescList
addDummyOp, addSortCols, getAllLeafOperators, getAllNative, getAllOperators, getDummyOps, getInputSourceToRuntimeValuesInfo, getIsTestForcedVectorizationEnable, getIsTestVectorizationSuppressExplainExecutionMode, getLlapMode, getMapRedLocalWork, getName, getNotVectorizedReason, getReservedMemoryMB, getSortCols, getTag, getUberMode, getUsesVectorUDFAdaptor, getVectorizationEnabled, getVectorizationExamined, getVectorizedRowBatchCtx, getVectorizedTestingReducerBatchSize, getVectorizedVertexNum, setAllNative, setDummyOps, setGatheringStats, setInputSourceToRuntimeValuesInfo, setIsTestForcedVectorizationEnable, setIsTestVectorizationSuppressExplainExecutionMode, setLlapMode, setMapRedLocalWork, setName, setNotVectorizedReason, setReservedMemoryMB, setTag, setUberMode, setUsesVectorUDFAdaptor, setVectorizationEnabled, setVectorizationExamined, setVectorizedRowBatchCtx, setVectorizedTestingReducerBatchSize, setVectorizedVertexNum
clone, fillSignature, getColumnExprMap, getColumnExprMapForExplain, getMaxMemoryAvailable, getMemoryNeeded, getOpProps, getRuntimeStatsTmpDir, getStatistics, getTraits, getUserLevelStatistics, getVectorDesc, getVectorMode, isSame, setColumnExprMap, setMaxMemoryAvailable, setMemoryNeeded, setOpProps, setRuntimeStatsTmpDir, setStatistics, setTraits, setVectorDesc, setVectorMode
public MergeFileWork(List<org.apache.hadoop.fs.Path> inputPaths, org.apache.hadoop.fs.Path outputDir, String srcTblInputFormat, TableDesc tbl)
public List<org.apache.hadoop.fs.Path> getInputPaths()
public void setInputPaths(List<org.apache.hadoop.fs.Path> inputPaths)
public org.apache.hadoop.fs.Path getOutputDir()
public void setOutputDir(org.apache.hadoop.fs.Path outputDir)
public Long getMinSplitSize()
getMinSplitSize
in class MapWork
public String getInputformat()
getInputformat
in class MapWork
public Class<? extends org.apache.hadoop.mapred.InputFormat> getInputformatClass()
public boolean isGatheringStats()
isGatheringStats
in class BaseWork
public boolean hasDynamicPartitions()
public void setHasDynamicPartitions(boolean hasDynamicPartitions)
public void resolveDynamicPartitionStoredAsSubDirsMerge(HiveConf conf, org.apache.hadoop.fs.Path path, TableDesc tblDesc, ArrayList<String> aliases, PartitionDesc partDesc)
resolveDynamicPartitionStoredAsSubDirsMerge
in class MapWork
public void resolveConcatenateMerge(HiveConf conf)
public ListBucketingCtx getListBucketingCtx()
public void setListBucketingCtx(ListBucketingCtx listBucketingCtx)
listBucketingCtx
- the listBucketingCtx to set
public boolean isListBucketingAlterTableConcatenate()
public String getSourceTableInputFormat()
public void setSourceTableInputFormat(String srcTblInputFormat)
public String getMergeLevel()
Copyright © 2022 The Apache Software Foundation. All rights reserved.