public class MapWork extends BaseWork
Modifier and Type | Field and Description |
---|---|
static int |
SAMPLING_ON_PREV_MR |
static int |
SAMPLING_ON_START |
Constructor and Description |
---|
MapWork() |
Modifier and Type | Method and Description |
---|---|
void |
addIndexIntermediateFile(java.lang.String fileName) |
void |
addMapWork(java.lang.String path,
java.lang.String alias,
Operator<?> work,
PartitionDesc pd) |
void |
configureJobConf(JobConf job) |
void |
deriveExplainAttributes()
Derive additional attributes to be rendered by EXPLAIN.
|
java.util.ArrayList<java.lang.String> |
getAliases() |
java.util.LinkedHashMap<java.lang.String,PartitionDesc> |
getAliasToPartnInfo() |
java.util.LinkedHashMap<java.lang.String,Operator<? extends OperatorDesc>> |
getAliasToWork() |
protected java.util.List<Operator<?>> |
getAllRootOperators() |
java.util.Map<java.lang.String,java.util.List<BucketingSortingCtx.BucketCol>> |
getBucketedColsByDirectory() |
boolean |
getHadoopSupportsSplittable() |
java.lang.String |
getIndexIntermediateFile() |
java.lang.String |
getInputformat() |
QBJoinTree |
getJoinTree() |
MapredLocalWork |
getMapLocalWork() |
java.lang.Long |
getMaxSplitSize() |
java.lang.Long |
getMinSplitSize() |
java.lang.Long |
getMinSplitSizePerNode() |
java.lang.Long |
getMinSplitSizePerRack() |
java.util.HashMap<java.lang.String,SplitSample> |
getNameToSplitSample() |
java.lang.Integer |
getNumMapTasks() |
java.util.LinkedHashMap<Operator<? extends OperatorDesc>,OpParseContext> |
getOpParseCtxMap() |
java.util.ArrayList<PartitionDesc> |
getPartitionDescs() |
java.util.ArrayList<java.lang.String> |
getPaths() |
java.util.LinkedHashMap<java.lang.String,java.util.ArrayList<java.lang.String>> |
getPathToAliases() |
java.util.LinkedHashMap<java.lang.String,PartitionDesc> |
getPathToPartitionInfo() |
int |
getSamplingType() |
java.lang.String |
getSamplingTypeString() |
java.util.Map<java.lang.String,java.util.List<BucketingSortingCtx.SortCol>> |
getSortedColsByDirectory() |
java.lang.String |
getTmpHDFSFileURI() |
java.util.Map<java.lang.String,java.util.ArrayList<java.lang.String>> |
getTruncatedPathToAliases()
This is used to display and verify the output of "Path -> Alias" in the test framework.
|
java.util.ArrayList<Operator<?>> |
getWorks() |
void |
initialize() |
boolean |
isInputFormatSorted() |
boolean |
isMapperCannotSpanPartns() |
boolean |
isUseBucketizedHiveInputFormat() |
void |
mergeAliasedInput(java.lang.String alias,
java.lang.String pathDir,
PartitionDesc partitionInfo) |
void |
mergingInto(MapWork mapWork) |
void |
resolveDynamicPartitionStoredAsSubDirsMerge(HiveConf conf,
Path path,
TableDesc tblDesc,
java.util.ArrayList<java.lang.String> aliases,
PartitionDesc partDesc) |
void |
setAliasToPartnInfo(java.util.LinkedHashMap<java.lang.String,PartitionDesc> aliasToPartnInfo) |
void |
setAliasToWork(java.util.LinkedHashMap<java.lang.String,Operator<? extends OperatorDesc>> aliasToWork) |
void |
setHadoopSupportsSplittable(boolean hadoopSupportsSplittable) |
void |
setInputformat(java.lang.String inputformat) |
void |
setInputFormatSorted(boolean inputFormatSorted) |
void |
setJoinTree(QBJoinTree joinTree) |
void |
setMapLocalWork(MapredLocalWork mapLocalWork) |
void |
setMapperCannotSpanPartns(boolean mapperCannotSpanPartns) |
void |
setMaxSplitSize(java.lang.Long maxSplitSize) |
void |
setMinSplitSize(java.lang.Long minSplitSize) |
void |
setMinSplitSizePerNode(java.lang.Long minSplitSizePerNode) |
void |
setMinSplitSizePerRack(java.lang.Long minSplitSizePerRack) |
void |
setNameToSplitSample(java.util.HashMap<java.lang.String,SplitSample> nameToSplitSample) |
void |
setNumMapTasks(java.lang.Integer numMapTasks) |
void |
setOpParseCtxMap(java.util.LinkedHashMap<Operator<? extends OperatorDesc>,OpParseContext> opParseCtxMap) |
void |
setPathToAliases(java.util.LinkedHashMap<java.lang.String,java.util.ArrayList<java.lang.String>> pathToAliases) |
void |
setPathToPartitionInfo(java.util.LinkedHashMap<java.lang.String,PartitionDesc> pathToPartitionInfo) |
void |
setSamplingType(int samplingType) |
void |
setTmpHDFSFileURI(java.lang.String tmpHDFSFileURI) |
void |
setUseBucketizedHiveInputFormat(boolean useBucketizedHiveInputFormat) |
getAllOperators, isGatheringStats, setGatheringStats
clone
public static final int SAMPLING_ON_PREV_MR
public static final int SAMPLING_ON_START
public java.util.LinkedHashMap<java.lang.String,java.util.ArrayList<java.lang.String>> getPathToAliases()
public void setPathToAliases(java.util.LinkedHashMap<java.lang.String,java.util.ArrayList<java.lang.String>> pathToAliases)
public java.util.Map<java.lang.String,java.util.ArrayList<java.lang.String>> getTruncatedPathToAliases()
public java.util.LinkedHashMap<java.lang.String,PartitionDesc> getPathToPartitionInfo()
public void setPathToPartitionInfo(java.util.LinkedHashMap<java.lang.String,PartitionDesc> pathToPartitionInfo)
public void deriveExplainAttributes()
public java.util.LinkedHashMap<java.lang.String,PartitionDesc> getAliasToPartnInfo()
public void setAliasToPartnInfo(java.util.LinkedHashMap<java.lang.String,PartitionDesc> aliasToPartnInfo)
Parameters:
aliasToPartnInfo - the aliasToPartnInfo to set
public java.util.LinkedHashMap<java.lang.String,Operator<? extends OperatorDesc>> getAliasToWork()
public void setAliasToWork(java.util.LinkedHashMap<java.lang.String,Operator<? extends OperatorDesc>> aliasToWork)
public MapredLocalWork getMapLocalWork()
public void setMapLocalWork(MapredLocalWork mapLocalWork)
Parameters:
mapLocalWork - the mapredLocalWork to set
public java.util.HashMap<java.lang.String,SplitSample> getNameToSplitSample()
public void setNameToSplitSample(java.util.HashMap<java.lang.String,SplitSample> nameToSplitSample)
public java.lang.Integer getNumMapTasks()
public void setNumMapTasks(java.lang.Integer numMapTasks)
public void addMapWork(java.lang.String path, java.lang.String alias, Operator<?> work, PartitionDesc pd)
public boolean isInputFormatSorted()
public void setInputFormatSorted(boolean inputFormatSorted)
public void resolveDynamicPartitionStoredAsSubDirsMerge(HiveConf conf, Path path, TableDesc tblDesc, java.util.ArrayList<java.lang.String> aliases, PartitionDesc partDesc)
protected java.util.List<Operator<?>> getAllRootOperators()
getAllRootOperators
in class BaseWork
public void mergeAliasedInput(java.lang.String alias, java.lang.String pathDir, PartitionDesc partitionInfo)
public void initialize()
public java.lang.Long getMaxSplitSize()
public void setMaxSplitSize(java.lang.Long maxSplitSize)
public java.lang.Long getMinSplitSize()
public void setMinSplitSize(java.lang.Long minSplitSize)
public java.lang.Long getMinSplitSizePerNode()
public void setMinSplitSizePerNode(java.lang.Long minSplitSizePerNode)
public java.lang.Long getMinSplitSizePerRack()
public void setMinSplitSizePerRack(java.lang.Long minSplitSizePerRack)
public java.lang.String getInputformat()
public void setInputformat(java.lang.String inputformat)
public boolean isUseBucketizedHiveInputFormat()
public void setUseBucketizedHiveInputFormat(boolean useBucketizedHiveInputFormat)
public QBJoinTree getJoinTree()
public void setJoinTree(QBJoinTree joinTree)
public void setMapperCannotSpanPartns(boolean mapperCannotSpanPartns)
public boolean isMapperCannotSpanPartns()
public boolean getHadoopSupportsSplittable()
public void setHadoopSupportsSplittable(boolean hadoopSupportsSplittable)
public java.lang.String getIndexIntermediateFile()
public java.util.ArrayList<java.lang.String> getAliases()
public java.util.ArrayList<Operator<?>> getWorks()
public java.util.ArrayList<java.lang.String> getPaths()
public java.util.ArrayList<PartitionDesc> getPartitionDescs()
public java.util.LinkedHashMap<Operator<? extends OperatorDesc>,OpParseContext> getOpParseCtxMap()
public void setOpParseCtxMap(java.util.LinkedHashMap<Operator<? extends OperatorDesc>,OpParseContext> opParseCtxMap)
public java.lang.String getTmpHDFSFileURI()
public void setTmpHDFSFileURI(java.lang.String tmpHDFSFileURI)
public void mergingInto(MapWork mapWork)
public java.util.Map<java.lang.String,java.util.List<BucketingSortingCtx.BucketCol>> getBucketedColsByDirectory()
public java.util.Map<java.lang.String,java.util.List<BucketingSortingCtx.SortCol>> getSortedColsByDirectory()
public void addIndexIntermediateFile(java.lang.String fileName)
public int getSamplingType()
public void setSamplingType(int samplingType)
public java.lang.String getSamplingTypeString()
public void configureJobConf(JobConf job)
Copyright © 2012 The Apache Software Foundation