public abstract class CrunchTool extends org.apache.hadoop.conf.Configured implements org.apache.hadoop.util.Tool, Serializable
An extension of the Tool interface that creates a Pipeline instance and provides methods for working with the Pipeline from inside of the Tool's run method.

Constructor and Description |
---|
CrunchTool() |
CrunchTool(boolean inMemory) |
Modifier and Type | Method and Description |
---|---|
PipelineResult | done() |
void | enableDebug() |
org.apache.hadoop.conf.Configuration | getConf() |
<T> Iterable<T> | materialize(PCollection<T> pcollection) |
<T> PCollection<T> | read(Source<T> source) |
<K,V> PTable<K,V> | read(TableSource<K,V> tableSource) |
PCollection<String> | readTextFile(String pathName) |
PipelineResult | run() |
PipelineExecution | runAsync() |
void | setConf(org.apache.hadoop.conf.Configuration conf) |
void | write(PCollection<?> pcollection, Target target) |
void | writeTextFile(PCollection<?> pcollection, String pathName) |
public void setConf(org.apache.hadoop.conf.Configuration conf)
Specified by: setConf in interface org.apache.hadoop.conf.Configurable
Overrides: setConf in class org.apache.hadoop.conf.Configured
public org.apache.hadoop.conf.Configuration getConf()
Specified by: getConf in interface org.apache.hadoop.conf.Configurable
Overrides: getConf in class org.apache.hadoop.conf.Configured
public void enableDebug()
public <T> PCollection<T> read(Source<T> source)
public <K,V> PTable<K,V> read(TableSource<K,V> tableSource)
public PCollection<String> readTextFile(String pathName)
public void write(PCollection<?> pcollection, Target target)
public void writeTextFile(PCollection<?> pcollection, String pathName)
public <T> Iterable<T> materialize(PCollection<T> pcollection)
public PipelineResult run()
public PipelineExecution runAsync()
public PipelineResult done()
Copyright © 2016 The Apache Software Foundation. All rights reserved.