A B C D E F G H I J K L M N O P Q R S T U V W

A

accept(T) - Method in class com.cloudera.crunch.FilterFn
If true, emit the given record.
accept(S) - Method in class com.cloudera.crunch.FilterFn.AndFn
 
accept(S) - Method in class com.cloudera.crunch.FilterFn.NotFn
 
accept(S) - Method in class com.cloudera.crunch.FilterFn.OrFn
 
accept(PCollectionImpl.Visitor) - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
accept(OutputHandler, PType<?>) - Method in class com.cloudera.crunch.io.avro.AvroFileTarget
 
accept(OutputHandler, PType<?>) - Method in class com.cloudera.crunch.io.hbase.HBaseTarget
 
accept(OutputHandler, PType<?>) - Method in class com.cloudera.crunch.io.impl.FileTargetImpl
 
accept(OutputHandler, PType<?>) - Method in class com.cloudera.crunch.io.impl.SourceTargetImpl
 
accept(OutputHandler, PType<?>) - Method in interface com.cloudera.crunch.Target
 
accept(Class<?>) - Method in class com.cloudera.crunch.type.avro.SafeAvroSerialization
 
acceptInternal(PCollectionImpl.Visitor) - Method in class com.cloudera.crunch.impl.mr.collect.DoCollectionImpl
 
acceptInternal(PCollectionImpl.Visitor) - Method in class com.cloudera.crunch.impl.mr.collect.DoTableImpl
 
acceptInternal(PCollectionImpl.Visitor) - Method in class com.cloudera.crunch.impl.mr.collect.InputCollection
 
acceptInternal(PCollectionImpl.Visitor) - Method in class com.cloudera.crunch.impl.mr.collect.InputTable
 
acceptInternal(PCollectionImpl.Visitor) - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
acceptInternal(PCollectionImpl.Visitor) - Method in class com.cloudera.crunch.impl.mr.collect.PGroupedTableImpl
 
acceptInternal(PCollectionImpl.Visitor) - Method in class com.cloudera.crunch.impl.mr.collect.UnionCollection
 
acceptInternal(PCollectionImpl.Visitor) - Method in class com.cloudera.crunch.impl.mr.collect.UnionTable
 
addChild(DoNode) - Method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
addDependency(JobPrototype) - Method in class com.cloudera.crunch.impl.mr.plan.JobPrototype
 
addDependingJob(ControlledJob) - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
Add a job to this job's dependency list.
addInputPath(Job, Path, Class<? extends InputFormat>, int) - Static method in class com.cloudera.crunch.impl.mr.run.CrunchInputs
 
addJob(CrunchJob) - Method in class com.cloudera.crunch.impl.mr.exec.MRExecutor
 
addJob(ControlledJob) - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl
Add a new job.
addJobCollection(Collection<ControlledJob>) - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl
Add a collection of jobs.
addNamedOutput(Job, String, Class<? extends OutputFormat>, Class<?>, Class<?>) - Static method in class org.apache.hadoop.mapreduce.lib.output.CrunchMultipleOutputs
Adds a named output for the job.
addReducePaths(HashMultimap<Target, NodePath>) - Method in class com.cloudera.crunch.impl.mr.plan.JobPrototype
 
Aggregate - Class in com.cloudera.crunch.lib
Methods for performing various types of aggregations over PCollection instances.
Aggregate() - Constructor for class com.cloudera.crunch.lib.Aggregate
 
Aggregate.PairValueComparator<K,V> - Class in com.cloudera.crunch.lib
 
Aggregate.PairValueComparator(boolean) - Constructor for class com.cloudera.crunch.lib.Aggregate.PairValueComparator
 
Aggregate.TopKCombineFn<K,V> - Class in com.cloudera.crunch.lib
 
Aggregate.TopKCombineFn(int, boolean) - Constructor for class com.cloudera.crunch.lib.Aggregate.TopKCombineFn
 
Aggregate.TopKFn<K,V> - Class in com.cloudera.crunch.lib
 
Aggregate.TopKFn(int, boolean) - Constructor for class com.cloudera.crunch.lib.Aggregate.TopKFn
 
aggregator(CombineFn.Aggregator<V>) - Static method in class com.cloudera.crunch.CombineFn
 
AGGREGATOR_BUCKETS - Static variable in class com.cloudera.crunch.impl.mr.run.RuntimeParameters
 
aggregatorFactory(CombineFn.AggregatorFactory<V>) - Static method in class com.cloudera.crunch.CombineFn
 
allFinished() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl
 
and(FilterFn<S>...) - Static method in class com.cloudera.crunch.FilterFn
 
as(PType<T>) - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
as(PType<T>) - Method in interface com.cloudera.crunch.type.PTypeFamily
Returns the equivalent of the given ptype for this family, if it exists.
as(PType<T>) - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
asSourceTarget(PType<T>) - Method in class com.cloudera.crunch.io.avro.AvroFileTarget
 
asSourceTarget(PType<T>) - Method in class com.cloudera.crunch.io.hbase.HBaseTarget
 
asSourceTarget(PType<T>) - Method in class com.cloudera.crunch.io.impl.FileTargetImpl
 
asSourceTarget(PType<S>) - Method in class com.cloudera.crunch.io.impl.SourceTargetImpl
 
asSourceTarget(PType<T>) - Method in class com.cloudera.crunch.io.seq.SeqFileTarget
 
asSourceTarget(PType<T>) - Method in class com.cloudera.crunch.io.text.TextFileTarget
 
asSourceTarget(PType<T>) - Method in interface com.cloudera.crunch.Target
 
At - Class in com.cloudera.crunch.io
Static factory methods for creating various SourceTarget types.
At() - Constructor for class com.cloudera.crunch.io.At
 
at - Static variable in class com.cloudera.crunch.tool.CrunchTool
 
avroFile(String, AvroType<T>) - Static method in class com.cloudera.crunch.io.At
 
avroFile(Path, AvroType<T>) - Static method in class com.cloudera.crunch.io.At
 
avroFile(String, AvroType<T>) - Static method in class com.cloudera.crunch.io.From
 
avroFile(Path, AvroType<T>) - Static method in class com.cloudera.crunch.io.From
 
avroFile(String) - Static method in class com.cloudera.crunch.io.To
 
avroFile(Path) - Static method in class com.cloudera.crunch.io.To
 
AvroFileReaderFactory<T> - Class in com.cloudera.crunch.io.avro
 
AvroFileReaderFactory(AvroType<T>) - Constructor for class com.cloudera.crunch.io.avro.AvroFileReaderFactory
 
AvroFileSource<T> - Class in com.cloudera.crunch.io.avro
 
AvroFileSource(Path, AvroType<T>) - Constructor for class com.cloudera.crunch.io.avro.AvroFileSource
 
AvroFileSourceTarget<T> - Class in com.cloudera.crunch.io.avro
 
AvroFileSourceTarget(Path, AvroType<T>) - Constructor for class com.cloudera.crunch.io.avro.AvroFileSourceTarget
 
AvroFileTarget - Class in com.cloudera.crunch.io.avro
 
AvroFileTarget(String) - Constructor for class com.cloudera.crunch.io.avro.AvroFileTarget
 
AvroFileTarget(Path) - Constructor for class com.cloudera.crunch.io.avro.AvroFileTarget
 
AvroGroupedTableType<K,V> - Class in com.cloudera.crunch.type.avro
 
AvroGroupedTableType(AvroTableType<K, V>) - Constructor for class com.cloudera.crunch.type.avro.AvroGroupedTableType
 
AvroInputFormat<T> - Class in com.cloudera.crunch.type.avro
An InputFormat for Avro data files.
AvroInputFormat() - Constructor for class com.cloudera.crunch.type.avro.AvroInputFormat
 
AvroKeyConverter<K> - Class in com.cloudera.crunch.type.avro
 
AvroKeyConverter() - Constructor for class com.cloudera.crunch.type.avro.AvroKeyConverter
 
AvroOutputFormat<T> - Class in com.cloudera.crunch.type.avro
An OutputFormat for Avro data files.
AvroOutputFormat() - Constructor for class com.cloudera.crunch.type.avro.AvroOutputFormat
 
AvroPairConverter<K,V> - Class in com.cloudera.crunch.type.avro
 
AvroPairConverter() - Constructor for class com.cloudera.crunch.type.avro.AvroPairConverter
 
AvroRecordReader<T> - Class in com.cloudera.crunch.type.avro
A RecordReader for Avro data files.
AvroRecordReader(Schema) - Constructor for class com.cloudera.crunch.type.avro.AvroRecordReader
 
Avros - Class in com.cloudera.crunch.type.avro
Defines static methods that are analogous to the methods defined in AvroTypeFamily for convenient static importing.
AvroTableType<K,V> - Class in com.cloudera.crunch.type.avro
The implementation of the PTableType interface for Avro-based serialization.
AvroTableType(AvroType<K>, AvroType<V>, Class<Pair<K, V>>) - Constructor for class com.cloudera.crunch.type.avro.AvroTableType
 
AvroType<T> - Class in com.cloudera.crunch.type.avro
The implementation of the PType interface for Avro-based serialization.
AvroType(Class<T>, Schema, PType...) - Constructor for class com.cloudera.crunch.type.avro.AvroType
 
AvroType(Class<T>, Schema, MapFn, MapFn, PType...) - Constructor for class com.cloudera.crunch.type.avro.AvroType
 
AvroTypeFamily - Class in com.cloudera.crunch.type.avro
 
AvroUtf8InputFormat - Class in com.cloudera.crunch.type.avro
An InputFormat for text files.
AvroUtf8InputFormat() - Constructor for class com.cloudera.crunch.type.avro.AvroUtf8InputFormat
 

B

bigInt(PTypeFamily) - Static method in class com.cloudera.crunch.util.PTypes
 
BIGINT_TO_BYTE - Static variable in class com.cloudera.crunch.util.PTypes
 
booleans() - Static method in class com.cloudera.crunch.type.avro.Avros
 
booleans() - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
booleans() - Method in interface com.cloudera.crunch.type.PTypeFamily
 
booleans() - Static method in class com.cloudera.crunch.type.writable.Writables
 
booleans() - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
bottom(int) - Method in class com.cloudera.crunch.impl.mem.collect.MemTable
 
bottom(int) - Method in class com.cloudera.crunch.impl.mr.collect.PTableBase
 
bottom(int) - Method in interface com.cloudera.crunch.PTable
Returns a PTable made up of the pairs in this PTable with the smallest value field.
build() - Method in class com.cloudera.crunch.GroupingOptions.Builder
 
build() - Method in class com.cloudera.crunch.impl.mr.plan.JobNameBuilder
 
builder() - Static method in class com.cloudera.crunch.GroupingOptions
 
by(int, Sort.Order) - Static method in class com.cloudera.crunch.lib.Sort.ColumnOrder
 
BYTE_TO_BIGINT - Static variable in class com.cloudera.crunch.util.PTypes
 
bytes() - Static method in class com.cloudera.crunch.type.avro.Avros
 
bytes() - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
bytes() - Method in interface com.cloudera.crunch.type.PTypeFamily
 
bytes() - Static method in class com.cloudera.crunch.type.writable.Writables
 
bytes() - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
BYTES_IN - Static variable in class com.cloudera.crunch.type.avro.Avros
 
BZip2TextInputFormat - Class in com.cloudera.crunch.io.text
 
BZip2TextInputFormat() - Constructor for class com.cloudera.crunch.io.text.BZip2TextInputFormat
 

C

CBZip2InputStream - Class in com.cloudera.crunch.io.text
An input stream that decompresses from the BZip2 format (without the file header chars) to be read as any other stream.
CBZip2InputStream(FSDataInputStream, int, long) - Constructor for class com.cloudera.crunch.io.text.CBZip2InputStream
 
checkRunningState() - Method in class com.cloudera.crunch.impl.mr.exec.CrunchJob
 
checkRunningState() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
Check the state of this running job.
cleanup(Emitter<T>) - Method in class com.cloudera.crunch.DoFn
Called during the cleanup of the MapReduce job this DoFn is associated with.
cleanup(Mapper<Object, Object, Object, Object>.Context) - Method in class com.cloudera.crunch.impl.mr.run.CrunchMapper
 
cleanup(Reducer<Object, Object, Object, Object>.Context) - Method in class com.cloudera.crunch.impl.mr.run.CrunchReducer
 
cleanup() - Method in class com.cloudera.crunch.impl.mr.run.CrunchTaskContext
 
cleanup() - Method in class com.cloudera.crunch.impl.mr.run.RTNode
 
cleanup(Emitter<Pair<Boolean, Pair<K, V>>>) - Method in class com.cloudera.crunch.lib.Aggregate.TopKFn
 
clearCounters() - Static method in class com.cloudera.crunch.test.TestCounters
 
clearWritten(int) - Method in class com.cloudera.crunch.type.writable.TupleWritable
Record that the tuple does not contain an element at the position provided.
clearWritten() - Method in class com.cloudera.crunch.type.writable.TupleWritable
Clear any record of which writables have been written to, without releasing storage.
close() - Method in class com.cloudera.crunch.type.avro.AvroRecordReader
 
close() - Method in class org.apache.hadoop.mapreduce.lib.output.CrunchMultipleOutputs
Closes all the opened outputs.
cogroup(PTable<K, U>) - Method in class com.cloudera.crunch.impl.mem.collect.MemTable
 
cogroup(PTable<K, U>) - Method in class com.cloudera.crunch.impl.mr.collect.PTableBase
 
Cogroup - Class in com.cloudera.crunch.lib
 
Cogroup() - Constructor for class com.cloudera.crunch.lib.Cogroup
 
cogroup(PTable<K, U>, PTable<K, V>) - Static method in class com.cloudera.crunch.lib.Cogroup
Co-groups the two PTable arguments.
cogroup(PTable<K, U>) - Method in interface com.cloudera.crunch.PTable
Co-group operation with the given table on common keys.
collectionOf(T...) - Static method in class com.cloudera.crunch.impl.mem.MemPipeline
 
collectionOf(Iterable<T>) - Static method in class com.cloudera.crunch.impl.mem.MemPipeline
 
collections(PType<T>) - Static method in class com.cloudera.crunch.type.avro.Avros
 
collections(PType<T>) - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
collections(PType<T>) - Method in interface com.cloudera.crunch.type.PTypeFamily
 
collections(PType<T>) - Static method in class com.cloudera.crunch.type.writable.Writables
 
collections(PType<T>) - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
Collects - Class in com.cloudera.crunch.util
Utility functions for returning Collection objects backed by different types of implementations.
collectValues() - Method in class com.cloudera.crunch.impl.mem.collect.MemTable
 
collectValues() - Method in class com.cloudera.crunch.impl.mr.collect.PTableBase
 
collectValues(PTable<K, V>) - Static method in class com.cloudera.crunch.lib.Aggregate
 
collectValues() - Method in interface com.cloudera.crunch.PTable
Aggregate all of the values with the same key into a single key-value pair in the returned PTable.
com.cloudera.crunch - package com.cloudera.crunch
 
com.cloudera.crunch.fn - package com.cloudera.crunch.fn
 
com.cloudera.crunch.impl.mem - package com.cloudera.crunch.impl.mem
 
com.cloudera.crunch.impl.mem.collect - package com.cloudera.crunch.impl.mem.collect
 
com.cloudera.crunch.impl.mr - package com.cloudera.crunch.impl.mr
 
com.cloudera.crunch.impl.mr.collect - package com.cloudera.crunch.impl.mr.collect
 
com.cloudera.crunch.impl.mr.emit - package com.cloudera.crunch.impl.mr.emit
 
com.cloudera.crunch.impl.mr.exec - package com.cloudera.crunch.impl.mr.exec
 
com.cloudera.crunch.impl.mr.plan - package com.cloudera.crunch.impl.mr.plan
 
com.cloudera.crunch.impl.mr.run - package com.cloudera.crunch.impl.mr.run
 
com.cloudera.crunch.io - package com.cloudera.crunch.io
 
com.cloudera.crunch.io.avro - package com.cloudera.crunch.io.avro
 
com.cloudera.crunch.io.hbase - package com.cloudera.crunch.io.hbase
 
com.cloudera.crunch.io.impl - package com.cloudera.crunch.io.impl
 
com.cloudera.crunch.io.seq - package com.cloudera.crunch.io.seq
 
com.cloudera.crunch.io.text - package com.cloudera.crunch.io.text
 
com.cloudera.crunch.lib - package com.cloudera.crunch.lib
 
com.cloudera.crunch.materialize - package com.cloudera.crunch.materialize
 
com.cloudera.crunch.test - package com.cloudera.crunch.test
 
com.cloudera.crunch.tool - package com.cloudera.crunch.tool
 
com.cloudera.crunch.type - package com.cloudera.crunch.type
 
com.cloudera.crunch.type.avro - package com.cloudera.crunch.type.avro
 
com.cloudera.crunch.type.writable - package com.cloudera.crunch.type.writable
 
com.cloudera.crunch.util - package com.cloudera.crunch.util
 
CombineFn<S,T> - Class in com.cloudera.crunch
A special DoFn implementation that converts an Iterable of values into a single value.
CombineFn() - Constructor for class com.cloudera.crunch.CombineFn
 
CombineFn.Aggregator<T> - Interface in com.cloudera.crunch
 
CombineFn.AggregatorCombineFn<K,V> - Class in com.cloudera.crunch
A CombineFn that delegates all of the actual work to an Aggregator instance.
CombineFn.AggregatorCombineFn(CombineFn.Aggregator<V>) - Constructor for class com.cloudera.crunch.CombineFn.AggregatorCombineFn
 
CombineFn.AggregatorFactory<T> - Interface in com.cloudera.crunch
Interface for constructing new aggregator instances.
CombineFn.FirstNAggregator<V> - Class in com.cloudera.crunch
 
CombineFn.FirstNAggregator(int) - Constructor for class com.cloudera.crunch.CombineFn.FirstNAggregator
 
CombineFn.LastNAggregator<V> - Class in com.cloudera.crunch
 
CombineFn.LastNAggregator(int) - Constructor for class com.cloudera.crunch.CombineFn.LastNAggregator
 
CombineFn.MaxBigInts - Class in com.cloudera.crunch
 
CombineFn.MaxBigInts() - Constructor for class com.cloudera.crunch.CombineFn.MaxBigInts
 
CombineFn.MaxDoubles - Class in com.cloudera.crunch
 
CombineFn.MaxDoubles() - Constructor for class com.cloudera.crunch.CombineFn.MaxDoubles
 
CombineFn.MaxFloats - Class in com.cloudera.crunch
 
CombineFn.MaxFloats() - Constructor for class com.cloudera.crunch.CombineFn.MaxFloats
 
CombineFn.MaxInts - Class in com.cloudera.crunch
 
CombineFn.MaxInts() - Constructor for class com.cloudera.crunch.CombineFn.MaxInts
 
CombineFn.MaxLongs - Class in com.cloudera.crunch
 
CombineFn.MaxLongs() - Constructor for class com.cloudera.crunch.CombineFn.MaxLongs
 
CombineFn.MaxNAggregator<V extends Comparable<V>> - Class in com.cloudera.crunch
 
CombineFn.MaxNAggregator(int) - Constructor for class com.cloudera.crunch.CombineFn.MaxNAggregator
 
CombineFn.MinBigInts - Class in com.cloudera.crunch
 
CombineFn.MinBigInts() - Constructor for class com.cloudera.crunch.CombineFn.MinBigInts
 
CombineFn.MinDoubles - Class in com.cloudera.crunch
 
CombineFn.MinDoubles() - Constructor for class com.cloudera.crunch.CombineFn.MinDoubles
 
CombineFn.MinFloats - Class in com.cloudera.crunch
 
CombineFn.MinFloats() - Constructor for class com.cloudera.crunch.CombineFn.MinFloats
 
CombineFn.MinInts - Class in com.cloudera.crunch
 
CombineFn.MinInts() - Constructor for class com.cloudera.crunch.CombineFn.MinInts
 
CombineFn.MinLongs - Class in com.cloudera.crunch
 
CombineFn.MinLongs() - Constructor for class com.cloudera.crunch.CombineFn.MinLongs
 
CombineFn.MinNAggregator<V extends Comparable<V>> - Class in com.cloudera.crunch
 
CombineFn.MinNAggregator(int) - Constructor for class com.cloudera.crunch.CombineFn.MinNAggregator
 
CombineFn.PairAggregator<V1,V2> - Class in com.cloudera.crunch
 
CombineFn.PairAggregator(CombineFn.Aggregator<V1>, CombineFn.Aggregator<V2>) - Constructor for class com.cloudera.crunch.CombineFn.PairAggregator
 
CombineFn.QuadAggregator<A,B,C,D> - Class in com.cloudera.crunch
 
CombineFn.QuadAggregator(CombineFn.Aggregator<A>, CombineFn.Aggregator<B>, CombineFn.Aggregator<C>, CombineFn.Aggregator<D>) - Constructor for class com.cloudera.crunch.CombineFn.QuadAggregator
 
CombineFn.SumBigInts - Class in com.cloudera.crunch
 
CombineFn.SumBigInts() - Constructor for class com.cloudera.crunch.CombineFn.SumBigInts
 
CombineFn.SumDoubles - Class in com.cloudera.crunch
 
CombineFn.SumDoubles() - Constructor for class com.cloudera.crunch.CombineFn.SumDoubles
 
CombineFn.SumFloats - Class in com.cloudera.crunch
 
CombineFn.SumFloats() - Constructor for class com.cloudera.crunch.CombineFn.SumFloats
 
CombineFn.SumInts - Class in com.cloudera.crunch
 
CombineFn.SumInts() - Constructor for class com.cloudera.crunch.CombineFn.SumInts
 
CombineFn.SumLongs - Class in com.cloudera.crunch
 
CombineFn.SumLongs() - Constructor for class com.cloudera.crunch.CombineFn.SumLongs
 
CombineFn.TripAggregator<A,B,C> - Class in com.cloudera.crunch
 
CombineFn.TripAggregator(CombineFn.Aggregator<A>, CombineFn.Aggregator<B>, CombineFn.Aggregator<C>) - Constructor for class com.cloudera.crunch.CombineFn.TripAggregator
 
CombineFn.TupleNAggregator - Class in com.cloudera.crunch
 
CombineFn.TupleNAggregator(CombineFn.Aggregator<?>...) - Constructor for class com.cloudera.crunch.CombineFn.TupleNAggregator
 
combineValues(CombineFn<K, V>) - Method in class com.cloudera.crunch.impl.mr.collect.PGroupedTableImpl
 
combineValues(CombineFn<K, V>) - Method in interface com.cloudera.crunch.PGroupedTable
Combines the values of this grouping using the given CombineFn.
comm(PCollection<T>, PCollection<T>) - Static method in class com.cloudera.crunch.lib.Set
Find the elements that are common to two sets, like the Unix comm utility.
compare(Pair<K, V>, Pair<K, V>) - Method in class com.cloudera.crunch.lib.Aggregate.PairValueComparator
 
compare(AvroWrapper<T>, AvroWrapper<T>) - Method in class com.cloudera.crunch.lib.JoinUtils.AvroPairGroupingComparator
 
compare(byte[], int, int, byte[], int, int) - Method in class com.cloudera.crunch.lib.JoinUtils.AvroPairGroupingComparator
 
compare(TupleWritable, TupleWritable) - Method in class com.cloudera.crunch.lib.JoinUtils.TupleWritableComparator
 
compare(byte[], int, int, byte[], int, int) - Method in class com.cloudera.crunch.lib.JoinUtils.TupleWritableComparator
 
compareTo(Pair<K, V>) - Method in class com.cloudera.crunch.Pair
 
compareTo(TupleWritable) - Method in class com.cloudera.crunch.type.writable.TupleWritable
 
CompositeMapFn<R,S,T> - Class in com.cloudera.crunch.fn
 
CompositeMapFn(MapFn<R, S>, MapFn<S, T>) - Constructor for class com.cloudera.crunch.fn.CompositeMapFn
 
CompositePathIterable<T> - Class in com.cloudera.crunch.io
 
configure(Configuration) - Method in class com.cloudera.crunch.DoFn
Called during the job planning phase.
configure(Job) - Method in class com.cloudera.crunch.GroupingOptions
 
configure(Target, PType<?>) - Method in class com.cloudera.crunch.impl.mr.plan.MSCROutputHandler
 
configure(Target, PType<?>) - Method in interface com.cloudera.crunch.io.OutputHandler
 
configure(Configuration) - Method in class com.cloudera.crunch.type.avro.AvroUtf8InputFormat
 
configureForMapReduce(Job, PType<?>, Path, String) - Method in class com.cloudera.crunch.io.avro.AvroFileTarget
 
configureForMapReduce(Job, PType<?>, Path, String) - Method in class com.cloudera.crunch.io.hbase.HBaseTarget
 
configureForMapReduce(Job, PType<?>, Path, String) - Method in class com.cloudera.crunch.io.impl.FileTargetImpl
 
configureForMapReduce(Job, Class, Class, Path, String) - Method in class com.cloudera.crunch.io.impl.FileTargetImpl
 
configureForMapReduce(Job, PType<?>, Path, String) - Method in class com.cloudera.crunch.io.impl.SourcePathTargetImpl
 
configureForMapReduce(Job, PType<?>, Path, String) - Method in interface com.cloudera.crunch.io.MapReduceTarget
 
configureForMapReduce(Job, PType<?>, Path, String) - Method in class com.cloudera.crunch.io.PathTargetImpl
 
configureNode(DoNode, Target) - Method in class com.cloudera.crunch.impl.mr.plan.MSCROutputHandler
 
configureReflectDataFactory(Configuration) - Static method in class com.cloudera.crunch.type.avro.Avros
 
configureShuffle(Job) - Method in class com.cloudera.crunch.impl.mr.collect.PGroupedTableImpl
 
configureShuffle(Job, GroupingOptions) - Method in class com.cloudera.crunch.type.avro.AvroGroupedTableType
 
configureShuffle(Job, GroupingOptions) - Method in class com.cloudera.crunch.type.PGroupedTableType
 
configureShuffle(Job, GroupingOptions) - Method in class com.cloudera.crunch.type.writable.WritableGroupedTableType
 
configureSource(Job, int) - Method in class com.cloudera.crunch.io.avro.AvroFileSource
 
configureSource(Job, int) - Method in class com.cloudera.crunch.io.hbase.HBaseSourceTarget
 
configureSource(Job, int) - Method in class com.cloudera.crunch.io.impl.FileSourceImpl
 
configureSource(Job, int) - Method in class com.cloudera.crunch.io.impl.SourceTargetImpl
 
configureSource(Job, int) - Method in class com.cloudera.crunch.io.seq.SeqFileTableSourceTarget
 
configureSource(Job, int) - Method in interface com.cloudera.crunch.Source
Configure the given job to use this source as an input.
containers(Class<T>) - Static method in class com.cloudera.crunch.type.avro.Avros
 
containers(Class<T>) - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
ControlledJob - Class in org.apache.hadoop.mapreduce.lib.jobcontrol
This class encapsulates a MapReduce job and its dependency.
ControlledJob(Job, List<ControlledJob>) - Constructor for class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
Construct a job.
ControlledJob(Configuration) - Constructor for class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
Construct a job.
ControlledJob.State - Enum in org.apache.hadoop.mapreduce.lib.jobcontrol
 
convert(PType<T>, PTypeFamily) - Static method in class com.cloudera.crunch.type.PTypeUtils
 
Converter<K,V,S,T> - Interface in com.cloudera.crunch.type
Converts the input key/value from a MapReduce task into the input to a DoFn, or takes the output of a DoFn and writes it to the output key/values.
convertInput(AvroWrapper<K>, NullWritable) - Method in class com.cloudera.crunch.type.avro.AvroKeyConverter
 
convertInput(AvroKey<K>, AvroValue<V>) - Method in class com.cloudera.crunch.type.avro.AvroPairConverter
 
convertInput(K, V) - Method in interface com.cloudera.crunch.type.Converter
 
convertInput(K, V) - Method in class com.cloudera.crunch.type.writable.WritablePairConverter
 
convertIterableInput(AvroWrapper<K>, Iterable<NullWritable>) - Method in class com.cloudera.crunch.type.avro.AvroKeyConverter
 
convertIterableInput(AvroKey<K>, Iterable<AvroValue<V>>) - Method in class com.cloudera.crunch.type.avro.AvroPairConverter
 
convertIterableInput(K, Iterable<V>) - Method in interface com.cloudera.crunch.type.Converter
 
convertIterableInput(K, Iterable<V>) - Method in class com.cloudera.crunch.type.writable.WritablePairConverter
 
count() - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
count() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
count(PCollection<S>) - Static method in class com.cloudera.crunch.lib.Aggregate
Returns a PTable that contains the unique elements of this collection mapped to a count of their occurrences.
count() - Method in interface com.cloudera.crunch.PCollection
Returns a PTable instance that contains the counts of each unique element of this PCollection.
create() - Method in interface com.cloudera.crunch.CombineFn.AggregatorFactory
 
create(FileSystem, Path, FileReaderFactory<S>) - Static method in class com.cloudera.crunch.io.CompositePathIterable
 
create(Class<T>, Class...) - Static method in class com.cloudera.crunch.type.TupleFactory
 
CREATE_DIR - Static variable in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 
createDoNode() - Method in class com.cloudera.crunch.impl.mr.collect.DoCollectionImpl
 
createDoNode() - Method in class com.cloudera.crunch.impl.mr.collect.DoTableImpl
 
createDoNode() - Method in class com.cloudera.crunch.impl.mr.collect.InputCollection
 
createDoNode() - Method in class com.cloudera.crunch.impl.mr.collect.InputTable
 
createDoNode() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
createDoNode() - Method in class com.cloudera.crunch.impl.mr.collect.PGroupedTableImpl
 
createDoNode() - Method in class com.cloudera.crunch.impl.mr.collect.UnionCollection
 
createDoNode() - Method in class com.cloudera.crunch.impl.mr.collect.UnionTable
 
createFnNode(String, DoFn<?, ?>, PType<?>) - Static method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
createGroupingNode(String, PGroupedTableType<K, V>) - Static method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
createInputNode(Source<S>) - Static method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
createIntermediateOutput(PType<T>) - Method in class com.cloudera.crunch.impl.mr.MRPipeline
 
createMapOnlyJob(HashMultimap<Target, NodePath>, Path) - Static method in class com.cloudera.crunch.impl.mr.plan.JobPrototype
 
createMapReduceJob(PGroupedTableImpl, Set<NodePath>, Path) - Static method in class com.cloudera.crunch.impl.mr.plan.JobPrototype
 
createOutputNode(String, PType<S>) - Static method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
createOutputPath() - Static method in class com.cloudera.crunch.test.FileHelper
 
createRecordReader(InputSplit, TaskAttemptContext) - Method in class com.cloudera.crunch.impl.mr.run.CrunchInputFormat
 
createRecordReader(InputSplit, TaskAttemptContext) - Method in class com.cloudera.crunch.io.text.BZip2TextInputFormat
 
createRecordReader(InputSplit, TaskAttemptContext) - Method in class com.cloudera.crunch.type.avro.AvroInputFormat
 
createRecordReader(InputSplit, TaskAttemptContext) - Method in class com.cloudera.crunch.type.avro.AvroUtf8InputFormat
 
createTempCopyOf(String) - Static method in class com.cloudera.crunch.test.FileHelper
 
createTempPath() - Method in class com.cloudera.crunch.impl.mr.MRPipeline
 
CRUNCH_WORKING_DIRECTORY - Static variable in class com.cloudera.crunch.impl.mr.plan.PlanningParameters
 
CrunchCombiner - Class in com.cloudera.crunch.impl.mr.run
 
CrunchCombiner() - Constructor for class com.cloudera.crunch.impl.mr.run.CrunchCombiner
 
CrunchInputFormat<K,V> - Class in com.cloudera.crunch.impl.mr.run
 
CrunchInputFormat() - Constructor for class com.cloudera.crunch.impl.mr.run.CrunchInputFormat
 
CrunchInputs - Class in com.cloudera.crunch.impl.mr.run
 
CrunchInputs() - Constructor for class com.cloudera.crunch.impl.mr.run.CrunchInputs
 
CrunchInputSplit - Class in com.cloudera.crunch.impl.mr.run
 
CrunchInputSplit() - Constructor for class com.cloudera.crunch.impl.mr.run.CrunchInputSplit
 
CrunchInputSplit(InputSplit, Class<? extends InputFormat>, int, Configuration) - Constructor for class com.cloudera.crunch.impl.mr.run.CrunchInputSplit
 
CrunchJob - Class in com.cloudera.crunch.impl.mr.exec
 
CrunchJob(Job, Path, MSCROutputHandler) - Constructor for class com.cloudera.crunch.impl.mr.exec.CrunchJob
 
CrunchMapper - Class in com.cloudera.crunch.impl.mr.run
 
CrunchMapper() - Constructor for class com.cloudera.crunch.impl.mr.run.CrunchMapper
 
CrunchMultipleOutputs<KEYOUT,VALUEOUT> - Class in org.apache.hadoop.mapreduce.lib.output
The MultipleOutputs class simplifies writing output data to multiple outputs.
CrunchMultipleOutputs(TaskInputOutputContext<?, ?, KEYOUT, VALUEOUT>) - Constructor for class org.apache.hadoop.mapreduce.lib.output.CrunchMultipleOutputs
Creates and initializes multiple outputs support; it should be instantiated in the Mapper/Reducer setup method.
CrunchReducer - Class in com.cloudera.crunch.impl.mr.run
 
CrunchReducer() - Constructor for class com.cloudera.crunch.impl.mr.run.CrunchReducer
 
CrunchRuntimeException - Exception in com.cloudera.crunch.impl.mr.run
 
CrunchRuntimeException(String) - Constructor for exception com.cloudera.crunch.impl.mr.run.CrunchRuntimeException
 
CrunchRuntimeException(Exception) - Constructor for exception com.cloudera.crunch.impl.mr.run.CrunchRuntimeException
 
CrunchTaskContext - Class in com.cloudera.crunch.impl.mr.run
 
CrunchTaskContext(TaskInputOutputContext<Object, Object, Object, Object>, NodeContext) - Constructor for class com.cloudera.crunch.impl.mr.run.CrunchTaskContext
 
CrunchTool - Class in com.cloudera.crunch.tool
An extension of the Tool interface that creates a Pipeline instance and provides methods for working with the Pipeline from inside of the Tool's run method.
CrunchTool() - Constructor for class com.cloudera.crunch.tool.CrunchTool
 
CrunchTool(boolean) - Constructor for class com.cloudera.crunch.tool.CrunchTool
 

D

DataBridge - Class in com.cloudera.crunch.type
Data structures for transitioning to the DoFns that make up a Crunch MapReduce task from the raw serialization input from the Hadoop MapReduce framework and back again.
DataBridge(Class<?>, Class<?>, Converter, MapFn, MapFn) - Constructor for class com.cloudera.crunch.type.DataBridge
 
DEBUG - Static variable in class com.cloudera.crunch.impl.mr.run.RuntimeParameters
 
derived(Class<T>, MapFn<S, T>, MapFn<T, S>, PType<S>) - Static method in class com.cloudera.crunch.type.avro.Avros
 
derived(Class<T>, MapFn<S, T>, MapFn<T, S>, PType<S>) - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
derived(Class<T>, MapFn<S, T>, MapFn<T, S>, PType<S>) - Method in interface com.cloudera.crunch.type.PTypeFamily
 
derived(Class<T>, MapFn<S, T>, MapFn<T, S>, PType<S>) - Static method in class com.cloudera.crunch.type.writable.Writables
 
derived(Class<T>, MapFn<S, T>, MapFn<T, S>, PType<S>) - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
difference(PCollection<T>, PCollection<T>) - Static method in class com.cloudera.crunch.lib.Set
Compute the set difference between two sets of elements.
DistCache - Class in com.cloudera.crunch.util
Functions for working with a job-specific distributed cache of objects, like the serialized runtime nodes in a MapReduce job.
DistCache() - Constructor for class com.cloudera.crunch.util.DistCache
 
DoCollectionImpl<S> - Class in com.cloudera.crunch.impl.mr.collect
 
DoFn<S,T> - Class in com.cloudera.crunch
Base class for all data processing functions in Crunch.
DoFn() - Constructor for class com.cloudera.crunch.DoFn
 
done() - Method in class com.cloudera.crunch.impl.mem.MemPipeline
 
done() - Method in class com.cloudera.crunch.impl.mr.MRPipeline
 
done() - Method in interface com.cloudera.crunch.Pipeline
Run any remaining jobs required to generate outputs and then clean up any intermediate data files that were created in this run or previous calls to run.
done() - Method in class com.cloudera.crunch.tool.CrunchTool
 
DoNode - Class in com.cloudera.crunch.impl.mr.plan
 
DoTableImpl<K,V> - Class in com.cloudera.crunch.impl.mr.collect
 
doubles() - Static method in class com.cloudera.crunch.type.avro.Avros
 
doubles() - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
doubles() - Method in interface com.cloudera.crunch.type.PTypeFamily
 
doubles() - Static method in class com.cloudera.crunch.type.writable.Writables
 
doubles() - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 

E

emit(T) - Method in interface com.cloudera.crunch.Emitter
Write the emitted value to the next stage of the pipeline.
emit(Object) - Method in class com.cloudera.crunch.impl.mr.emit.IntermediateEmitter
 
emit(T) - Method in class com.cloudera.crunch.impl.mr.emit.MultipleOutputEmitter
 
emit(T) - Method in class com.cloudera.crunch.impl.mr.emit.OutputEmitter
 
Emitter<T> - Interface in com.cloudera.crunch
Interface for writing outputs from a DoFn.
enableDebug() - Method in class com.cloudera.crunch.impl.mem.MemPipeline
 
enableDebug() - Method in class com.cloudera.crunch.impl.mr.MRPipeline
 
enableDebug() - Method in interface com.cloudera.crunch.Pipeline
Turn on debug logging for jobs that are run from this pipeline.
enableDebug() - Method in class com.cloudera.crunch.tool.CrunchTool
 
entrySet() - Method in class com.cloudera.crunch.type.writable.TextMapWritable
 
equals(Object) - Method in class com.cloudera.crunch.impl.mr.collect.InputCollection
 
equals(Object) - Method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
equals(Object) - Method in class com.cloudera.crunch.io.hbase.HBaseSourceTarget
 
equals(Object) - Method in class com.cloudera.crunch.io.hbase.HBaseTarget
 
equals(Object) - Method in class com.cloudera.crunch.io.impl.FileSourceImpl
 
equals(Object) - Method in class com.cloudera.crunch.io.impl.FileTargetImpl
 
equals(Object) - Method in class com.cloudera.crunch.io.impl.SourceTargetImpl
 
equals(Object) - Method in class com.cloudera.crunch.io.seq.SeqFileTableSourceTarget
 
equals(Object) - Method in class com.cloudera.crunch.Pair
 
equals(Object) - Method in class com.cloudera.crunch.Tuple3
 
equals(Object) - Method in class com.cloudera.crunch.Tuple4
 
equals(Object) - Method in class com.cloudera.crunch.TupleN
 
equals(Object) - Method in class com.cloudera.crunch.type.avro.AvroType
 
equals(Object) - Method in class com.cloudera.crunch.type.DataBridge
 
equals(Object) - Method in class com.cloudera.crunch.type.writable.GenericArrayWritable
 
equals(Object) - Method in class com.cloudera.crunch.type.writable.TupleWritable
 
equals(Object) - Method in class com.cloudera.crunch.type.writable.WritableType
 
execute() - Method in class com.cloudera.crunch.impl.mr.exec.MRExecutor
 

F

FileHelper - Class in com.cloudera.crunch.test
 
FileHelper() - Constructor for class com.cloudera.crunch.test.FileHelper
 
FileReaderFactory<T> - Interface in com.cloudera.crunch.io
 
FileSourceImpl<T> - Class in com.cloudera.crunch.io.impl
 
FileSourceImpl(Path, PType<T>, Class<? extends FileInputFormat>) - Constructor for class com.cloudera.crunch.io.impl.FileSourceImpl
 
FileTableSourceImpl<K,V> - Class in com.cloudera.crunch.io.impl
 
FileTableSourceImpl(Path, PTableType<K, V>, Class<? extends FileInputFormat>) - Constructor for class com.cloudera.crunch.io.impl.FileTableSourceImpl
 
FileTargetImpl - Class in com.cloudera.crunch.io.impl
 
FileTargetImpl(Path, Class<? extends FileOutputFormat>) - Constructor for class com.cloudera.crunch.io.impl.FileTargetImpl
 
filter(FilterFn<S>) - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
filter(FilterFn<S>) - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
filter(FilterFn<S>) - Method in interface com.cloudera.crunch.PCollection
Apply the given filter function to this instance and return the resulting PCollection.
FilterFn<T> - Class in com.cloudera.crunch
A DoFn for the common case of filtering the members of a PCollection based on a boolean condition.
FilterFn() - Constructor for class com.cloudera.crunch.FilterFn
 
FilterFn.AndFn<S> - Class in com.cloudera.crunch
 
FilterFn.AndFn(FilterFn<S>...) - Constructor for class com.cloudera.crunch.FilterFn.AndFn
 
FilterFn.NotFn<S> - Class in com.cloudera.crunch
 
FilterFn.NotFn(FilterFn<S>) - Constructor for class com.cloudera.crunch.FilterFn.NotFn
 
FilterFn.OrFn<S> - Class in com.cloudera.crunch
 
FilterFn.OrFn(FilterFn<S>...) - Constructor for class com.cloudera.crunch.FilterFn.OrFn
 
first() - Method in class com.cloudera.crunch.Pair
 
first() - Method in class com.cloudera.crunch.Tuple3
 
first() - Method in class com.cloudera.crunch.Tuple4
 
FIRST_N(int) - Static method in class com.cloudera.crunch.CombineFn
 
floats() - Static method in class com.cloudera.crunch.type.avro.Avros
 
floats() - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
floats() - Method in interface com.cloudera.crunch.type.PTypeFamily
 
floats() - Static method in class com.cloudera.crunch.type.writable.Writables
 
floats() - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
flush() - Method in interface com.cloudera.crunch.Emitter
Flushes any values cached by this emitter.
flush() - Method in class com.cloudera.crunch.impl.mr.emit.IntermediateEmitter
 
flush() - Method in class com.cloudera.crunch.impl.mr.emit.MultipleOutputEmitter
 
flush() - Method in class com.cloudera.crunch.impl.mr.emit.OutputEmitter
 
formattedFile(String, Class<? extends FileInputFormat>, PType<K>, PType<V>) - Static method in class com.cloudera.crunch.io.From
 
formattedFile(Path, Class<? extends FileInputFormat>, PType<K>, PType<V>) - Static method in class com.cloudera.crunch.io.From
 
formattedFile(String, Class<? extends FileOutputFormat>) - Static method in class com.cloudera.crunch.io.To
 
formattedFile(Path, Class<? extends FileOutputFormat>) - Static method in class com.cloudera.crunch.io.To
 
fourth() - Method in class com.cloudera.crunch.Tuple4
 
From - Class in com.cloudera.crunch.io
Static factory methods for creating various Source types.
From() - Constructor for class com.cloudera.crunch.io.From
 
from - Static variable in class com.cloudera.crunch.tool.CrunchTool
 

G

GenericArrayWritable<T> - Class in com.cloudera.crunch.type.writable
 
GenericArrayWritable(Class<? extends Writable>) - Constructor for class com.cloudera.crunch.type.writable.GenericArrayWritable
 
GenericArrayWritable() - Constructor for class com.cloudera.crunch.type.writable.GenericArrayWritable
 
generics(Schema) - Static method in class com.cloudera.crunch.type.avro.Avros
 
generics(Schema) - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
get(int) - Method in class com.cloudera.crunch.Pair
 
get(int) - Method in interface com.cloudera.crunch.Tuple
Returns the Object at the given index.
get(int) - Method in class com.cloudera.crunch.Tuple3
 
get(int) - Method in class com.cloudera.crunch.Tuple4
 
get(int) - Method in class com.cloudera.crunch.TupleN
 
get() - Method in class com.cloudera.crunch.type.writable.GenericArrayWritable
 
get(int) - Method in class com.cloudera.crunch.type.writable.TupleWritable
Returns the i-th Writable from the tuple.
getChildren() - Method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
getCollection() - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
getConf() - Method in class com.cloudera.crunch.impl.mr.run.CrunchInputSplit
 
getConf() - Method in class com.cloudera.crunch.tool.CrunchTool
 
getConfiguration() - Method in class com.cloudera.crunch.DoFn
 
getConfiguration() - Method in class com.cloudera.crunch.impl.mem.MemPipeline
 
getConfiguration() - Method in class com.cloudera.crunch.impl.mr.MRPipeline
 
getConfiguration() - Method in interface com.cloudera.crunch.Pipeline
Returns the Configuration instance associated with this pipeline.
getConfigurationKey() - Method in enum com.cloudera.crunch.impl.mr.run.NodeContext
 
getContext() - Method in class com.cloudera.crunch.impl.mr.run.CrunchTaskContext
 
getConverter() - Method in class com.cloudera.crunch.type.avro.AvroType
 
getConverter() - Method in class com.cloudera.crunch.type.DataBridge
 
getConverter() - Method in class com.cloudera.crunch.type.PGroupedTableType
 
getConverter() - Method in interface com.cloudera.crunch.type.PType
 
getConverter() - Method in class com.cloudera.crunch.type.writable.WritableType
 
getCounter(Enum<?>) - Method in class com.cloudera.crunch.DoFn
 
getCounter(String, String) - Method in class com.cloudera.crunch.DoFn
 
getCounter(Enum<?>) - Static method in class com.cloudera.crunch.test.TestCounters
 
getCounter(String, String) - Static method in class com.cloudera.crunch.test.TestCounters
 
getCountersEnabled(JobContext) - Static method in class org.apache.hadoop.mapreduce.lib.output.CrunchMultipleOutputs
Returns whether the counters for the named outputs are enabled.
getCrunchJob(Class<?>, Configuration) - Method in class com.cloudera.crunch.impl.mr.plan.JobPrototype
 
getCurrentKey() - Method in class com.cloudera.crunch.type.avro.AvroRecordReader
 
getCurrentValue() - Method in class com.cloudera.crunch.type.avro.AvroRecordReader
 
getDefaultFileSource(Path) - Method in class com.cloudera.crunch.type.avro.AvroType
 
getDefaultFileSource(Path) - Method in class com.cloudera.crunch.type.PGroupedTableType
 
getDefaultFileSource(Path) - Method in interface com.cloudera.crunch.type.PType
Returns a SourceTarget that is able to read/write data using the serialization format specified by this PType.
getDefaultFileSource(Path) - Method in class com.cloudera.crunch.type.writable.WritableType
 
getDependentJobs() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 
getDepth() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
getDeserializer(Class<AvroWrapper<T>>) - Method in class com.cloudera.crunch.type.avro.SafeAvroSerialization
Returns the specified map output deserializer.
getFailedJobList() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl
 
getFamily() - Method in class com.cloudera.crunch.type.avro.AvroType
 
getFamily() - Method in class com.cloudera.crunch.type.PGroupedTableType
 
getFamily() - Method in interface com.cloudera.crunch.type.PType
Returns the PTypeFamily that this PType belongs to.
getFamily() - Method in class com.cloudera.crunch.type.writable.WritableType
 
getFirst() - Method in class com.cloudera.crunch.fn.CompositeMapFn
 
getFormatNodeMap(JobContext) - Static method in class com.cloudera.crunch.impl.mr.run.CrunchInputs
 
getGroupedTableType() - Method in class com.cloudera.crunch.type.avro.AvroTableType
 
getGroupedTableType() - Method in interface com.cloudera.crunch.type.PTableType
Returns the grouped table version of this type.
getGroupingComparator(PTypeFamily) - Static method in class com.cloudera.crunch.lib.JoinUtils
 
getGroupingConverter() - Method in class com.cloudera.crunch.type.avro.AvroGroupedTableType
 
getGroupingConverter() - Method in class com.cloudera.crunch.type.PGroupedTableType
 
getGroupingConverter() - Method in class com.cloudera.crunch.type.writable.WritableGroupedTableType
 
getGroupingNode() - Method in class com.cloudera.crunch.impl.mr.collect.PGroupedTableImpl
 
getInputFormatClass() - Method in class com.cloudera.crunch.impl.mr.run.CrunchInputSplit
 
getInputMapFn() - Method in class com.cloudera.crunch.type.avro.AvroGroupedTableType
 
getInputMapFn() - Method in class com.cloudera.crunch.type.avro.AvroType
 
getInputMapFn() - Method in class com.cloudera.crunch.type.DataBridge
 
getInputMapFn() - Method in interface com.cloudera.crunch.type.PType
 
getInputMapFn() - Method in class com.cloudera.crunch.type.writable.WritableGroupedTableType
 
getInputMapFn() - Method in class com.cloudera.crunch.type.writable.WritableType
 
getInputSplit() - Method in class com.cloudera.crunch.impl.mr.run.CrunchInputSplit
 
getInstance() - Static method in class com.cloudera.crunch.fn.IdentityFn
 
getInstance() - Static method in class com.cloudera.crunch.impl.mem.MemPipeline
 
getInstance() - Static method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
getInstance() - Static method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
getJob() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 
getJobID() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 
getJobName() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 
getJobState() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 
getKeyClass() - Method in class com.cloudera.crunch.type.avro.AvroKeyConverter
 
getKeyClass() - Method in class com.cloudera.crunch.type.avro.AvroPairConverter
 
getKeyClass() - Method in interface com.cloudera.crunch.type.Converter
 
getKeyClass() - Method in class com.cloudera.crunch.type.writable.WritablePairConverter
 
getKeyType() - Method in class com.cloudera.crunch.impl.mem.collect.MemTable
 
getKeyType() - Method in class com.cloudera.crunch.impl.mr.collect.PTableBase
 
getKeyType() - Method in interface com.cloudera.crunch.PTable
Returns the PType of the key.
getKeyType() - Method in class com.cloudera.crunch.type.avro.AvroTableType
 
getKeyType() - Method in interface com.cloudera.crunch.type.PTableType
Returns the key type for the table.
getLength() - Method in class com.cloudera.crunch.impl.mr.run.CrunchInputSplit
 
getLocations() - Method in class com.cloudera.crunch.impl.mr.run.CrunchInputSplit
 
getMapredJobID() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 
getMaterializedAt() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
getMessage() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 
getMultiPaths() - Method in class com.cloudera.crunch.impl.mr.plan.MSCROutputHandler
 
getMultipleOutputs() - Method in class com.cloudera.crunch.impl.mr.run.CrunchTaskContext
 
getName() - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
getName() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
getName() - Method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
getName() - Method in interface com.cloudera.crunch.PCollection
Returns a shorthand name for this PCollection.
getNextAnonymousStageId() - Method in class com.cloudera.crunch.impl.mr.MRPipeline
 
getNodeContext() - Method in class com.cloudera.crunch.impl.mr.run.CrunchCombiner
 
getNodeContext() - Method in class com.cloudera.crunch.impl.mr.run.CrunchReducer
 
getNodeContext() - Method in class com.cloudera.crunch.impl.mr.run.CrunchTaskContext
 
getNodeIndex() - Method in class com.cloudera.crunch.impl.mr.run.CrunchInputSplit
 
getNodes() - Method in class com.cloudera.crunch.impl.mr.run.CrunchTaskContext
 
getNumReducers() - Method in class com.cloudera.crunch.GroupingOptions
 
getOnlyParent() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
getOutputMapFn() - Method in class com.cloudera.crunch.type.avro.AvroGroupedTableType
 
getOutputMapFn() - Method in class com.cloudera.crunch.type.avro.AvroType
 
getOutputMapFn() - Method in class com.cloudera.crunch.type.DataBridge
 
getOutputMapFn() - Method in interface com.cloudera.crunch.type.PType
 
getOutputMapFn() - Method in class com.cloudera.crunch.type.writable.WritableGroupedTableType
 
getOutputMapFn() - Method in class com.cloudera.crunch.type.writable.WritableType
 
getParents() - Method in class com.cloudera.crunch.impl.mr.collect.DoCollectionImpl
 
getParents() - Method in class com.cloudera.crunch.impl.mr.collect.DoTableImpl
 
getParents() - Method in class com.cloudera.crunch.impl.mr.collect.InputCollection
 
getParents() - Method in class com.cloudera.crunch.impl.mr.collect.InputTable
 
getParents() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
getParents() - Method in class com.cloudera.crunch.impl.mr.collect.PGroupedTableImpl
 
getParents() - Method in class com.cloudera.crunch.impl.mr.collect.UnionCollection
 
getParents() - Method in class com.cloudera.crunch.impl.mr.collect.UnionTable
 
getPartition(AvroKey, AvroValue, int) - Method in class com.cloudera.crunch.lib.JoinUtils.AvroIndexedRecordPartitioner
 
getPartition(TupleWritable, Writable, int) - Method in class com.cloudera.crunch.lib.JoinUtils.TupleWritablePartitioner
 
getPartitionerClass(PTypeFamily) - Static method in class com.cloudera.crunch.lib.JoinUtils
 
getPath() - Method in class com.cloudera.crunch.io.impl.FileTargetImpl
 
getPath() - Method in class com.cloudera.crunch.io.impl.SourcePathTargetImpl
 
getPath() - Method in interface com.cloudera.crunch.io.PathTarget
 
getPath() - Method in class com.cloudera.crunch.io.PathTargetImpl
 
getPath() - Method in class com.cloudera.crunch.io.seq.SeqFileTableSourceTarget
 
getPath() - Method in class com.cloudera.crunch.io.text.TextFileTarget
 
getPathSize(Configuration, Path) - Static method in class com.cloudera.crunch.io.SourceTargetHelper
 
getPathSize(FileSystem, Path) - Static method in class com.cloudera.crunch.io.SourceTargetHelper
 
getPipeline() - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
getPipeline() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
getPipeline() - Method in interface com.cloudera.crunch.PCollection
Returns the Pipeline associated with this PCollection.
getPos() - Method in class com.cloudera.crunch.io.text.CBZip2InputStream
getPos is used by the caller to know when the processing of the current InputSplit is complete.
getPos() - Method in class com.cloudera.crunch.type.avro.AvroRecordReader
 
getPrimitiveType(Class<T>) - Static method in class com.cloudera.crunch.type.avro.Avros
 
getPrimitiveType(Class<T>) - Static method in class com.cloudera.crunch.type.writable.Writables
 
getProgress() - Method in class com.cloudera.crunch.type.avro.AvroRecordReader
 
getPTableType() - Method in class com.cloudera.crunch.impl.mem.collect.MemTable
 
getPTableType() - Method in class com.cloudera.crunch.impl.mr.collect.DoTableImpl
 
getPTableType() - Method in class com.cloudera.crunch.impl.mr.collect.InputTable
 
getPTableType() - Method in class com.cloudera.crunch.impl.mr.collect.UnionTable
 
getPTableType() - Method in interface com.cloudera.crunch.PTable
Returns the PTableType of this PTable.
getPType() - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
getPType() - Method in class com.cloudera.crunch.impl.mr.collect.DoCollectionImpl
 
getPType() - Method in class com.cloudera.crunch.impl.mr.collect.DoTableImpl
 
getPType() - Method in class com.cloudera.crunch.impl.mr.collect.InputCollection
 
getPType() - Method in class com.cloudera.crunch.impl.mr.collect.InputTable
 
getPType() - Method in class com.cloudera.crunch.impl.mr.collect.PGroupedTableImpl
 
getPType() - Method in class com.cloudera.crunch.impl.mr.collect.UnionCollection
 
getPType() - Method in class com.cloudera.crunch.impl.mr.collect.UnionTable
 
getPType() - Method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
getPType() - Method in interface com.cloudera.crunch.PCollection
Returns the PType of this PCollection.
getReadCount() - Method in class com.cloudera.crunch.io.text.CBZip2InputStream
 
getReader(Schema) - Method in class com.cloudera.crunch.type.avro.ReflectDataFactory
 
getReadLimit() - Method in class com.cloudera.crunch.io.text.CBZip2InputStream
 
getReadyJobsList() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl
 
getRecordWriter(TaskAttemptContext) - Method in class com.cloudera.crunch.type.avro.AvroOutputFormat
 
getReflectData() - Method in class com.cloudera.crunch.type.avro.ReflectDataFactory
 
getReflectDataFactory(Configuration) - Static method in class com.cloudera.crunch.type.avro.Avros
 
getRunningJobList() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl
 
getSchema() - Method in class com.cloudera.crunch.type.avro.AvroType
 
getSecond() - Method in class com.cloudera.crunch.fn.CompositeMapFn
 
getSerializationClass() - Method in class com.cloudera.crunch.type.writable.WritableType
 
getSerializer(Class<AvroWrapper<T>>) - Method in class com.cloudera.crunch.type.avro.SafeAvroSerialization
Returns the specified output serializer.
getSize() - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
getSize() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
getSize(Configuration) - Method in class com.cloudera.crunch.io.hbase.HBaseSourceTarget
 
getSize(Configuration) - Method in class com.cloudera.crunch.io.impl.FileSourceImpl
 
getSize(Configuration) - Method in class com.cloudera.crunch.io.impl.SourceTargetImpl
 
getSize(Configuration) - Method in class com.cloudera.crunch.io.seq.SeqFileTableSourceTarget
 
getSize(Configuration) - Method in class com.cloudera.crunch.io.text.TextFileSource
 
getSize() - Method in interface com.cloudera.crunch.PCollection
Returns the size of the data represented by this PCollection in bytes.
getSize(Configuration) - Method in interface com.cloudera.crunch.Source
Returns the number of bytes in this Source.
getSizeInternal() - Method in class com.cloudera.crunch.impl.mr.collect.DoCollectionImpl
 
getSizeInternal() - Method in class com.cloudera.crunch.impl.mr.collect.DoTableImpl
 
getSizeInternal() - Method in class com.cloudera.crunch.impl.mr.collect.InputCollection
 
getSizeInternal() - Method in class com.cloudera.crunch.impl.mr.collect.InputTable
 
getSizeInternal() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
getSizeInternal() - Method in class com.cloudera.crunch.impl.mr.collect.PGroupedTableImpl
 
getSizeInternal() - Method in class com.cloudera.crunch.impl.mr.collect.UnionCollection
 
getSizeInternal() - Method in class com.cloudera.crunch.impl.mr.collect.UnionTable
 
getSortComparatorClass() - Method in class com.cloudera.crunch.GroupingOptions
 
getSource() - Method in class com.cloudera.crunch.impl.mr.collect.InputCollection
 
getSource() - Method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
getSourceTarget() - Method in class com.cloudera.crunch.materialize.MaterializableIterable
 
getSplits(JobContext) - Method in class com.cloudera.crunch.impl.mr.run.CrunchInputFormat
 
getStatus() - Method in class com.cloudera.crunch.DoFn
 
getSubTypes() - Method in class com.cloudera.crunch.type.avro.AvroType
 
getSubTypes() - Method in class com.cloudera.crunch.type.PGroupedTableType
 
getSubTypes() - Method in interface com.cloudera.crunch.type.PType
Returns the sub-types that make up this PType if it is a composite instance, such as a tuple.
getSubTypes() - Method in class com.cloudera.crunch.type.writable.WritableType
 
getSuccessfulJobList() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl
 
getTableType() - Method in class com.cloudera.crunch.io.hbase.HBaseSourceTarget
 
getTableType() - Method in class com.cloudera.crunch.io.impl.FileTableSourceImpl
 
getTableType() - Method in class com.cloudera.crunch.io.impl.TableSourcePathTargetImpl
 
getTableType() - Method in class com.cloudera.crunch.io.impl.TableSourceTargetImpl
 
getTableType() - Method in class com.cloudera.crunch.io.seq.SeqFileTableSourceTarget
 
getTableType() - Method in interface com.cloudera.crunch.TableSource
 
getTableType() - Method in class com.cloudera.crunch.type.PGroupedTableType
 
getTaskAttemptID() - Method in class com.cloudera.crunch.DoFn
 
getThreadState() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl
 
getType() - Method in class com.cloudera.crunch.io.hbase.HBaseSourceTarget
 
getType() - Method in class com.cloudera.crunch.io.impl.FileSourceImpl
 
getType() - Method in class com.cloudera.crunch.io.impl.SourceTargetImpl
 
getType() - Method in class com.cloudera.crunch.io.seq.SeqFileTableSourceTarget
 
getType() - Method in interface com.cloudera.crunch.Source
Returns the PType for this source.
getTypeClass() - Method in class com.cloudera.crunch.type.avro.AvroGroupedTableType
 
getTypeClass() - Method in class com.cloudera.crunch.type.avro.AvroType
 
getTypeClass() - Method in interface com.cloudera.crunch.type.PType
Returns the Java type represented by this PType.
getTypeClass() - Method in class com.cloudera.crunch.type.writable.WritableGroupedTableType
 
getTypeClass() - Method in class com.cloudera.crunch.type.writable.WritableType
 
getTypeFamily() - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
getTypeFamily() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
getTypeFamily() - Method in interface com.cloudera.crunch.PCollection
Returns the PTypeFamily of this PCollection.
getValueClass() - Method in class com.cloudera.crunch.type.avro.AvroKeyConverter
 
getValueClass() - Method in class com.cloudera.crunch.type.avro.AvroPairConverter
 
getValueClass() - Method in interface com.cloudera.crunch.type.Converter
 
getValueClass() - Method in class com.cloudera.crunch.type.writable.WritablePairConverter
 
getValueType() - Method in class com.cloudera.crunch.impl.mem.collect.MemTable
 
getValueType() - Method in class com.cloudera.crunch.impl.mr.collect.PTableBase
 
getValueType() - Method in interface com.cloudera.crunch.PTable
Returns the PType of the value.
getValueType() - Method in class com.cloudera.crunch.type.avro.AvroTableType
 
getValueType() - Method in interface com.cloudera.crunch.type.PTableType
Returns the value type for the table.
getWaitingJobList() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl
 
getWriter() - Method in class com.cloudera.crunch.type.avro.ReflectDataFactory
 
groupByKey() - Method in class com.cloudera.crunch.impl.mem.collect.MemTable
 
groupByKey(int) - Method in class com.cloudera.crunch.impl.mem.collect.MemTable
 
groupByKey(GroupingOptions) - Method in class com.cloudera.crunch.impl.mem.collect.MemTable
 
groupByKey() - Method in class com.cloudera.crunch.impl.mr.collect.PTableBase
 
groupByKey(int) - Method in class com.cloudera.crunch.impl.mr.collect.PTableBase
 
groupByKey(GroupingOptions) - Method in class com.cloudera.crunch.impl.mr.collect.PTableBase
 
groupByKey() - Method in interface com.cloudera.crunch.PTable
Performs a grouping operation on the keys of this table.
groupByKey(int) - Method in interface com.cloudera.crunch.PTable
Performs a grouping operation on the keys of this table, using the given number of partitions.
groupByKey(GroupingOptions) - Method in interface com.cloudera.crunch.PTable
Performs a grouping operation on the keys of this table, using the additional GroupingOptions to control how the grouping is executed.
groupingComparatorClass(Class<? extends RawComparator>) - Method in class com.cloudera.crunch.GroupingOptions.Builder
 
GroupingOptions - Class in com.cloudera.crunch
Options that can be passed to a groupByKey operation in order to exercise finer control over how the partitioning, grouping, and sorting of keys is performed.
GroupingOptions.Builder - Class in com.cloudera.crunch
Builder class for creating GroupingOptions instances.
GroupingOptions.Builder() - Constructor for class com.cloudera.crunch.GroupingOptions.Builder
 

H

has(int) - Method in class com.cloudera.crunch.type.writable.TupleWritable
Returns true if the tuple has an element at the position provided.
hasCombineFn() - Method in class com.cloudera.crunch.impl.mr.collect.DoTableImpl
 
hashCode() - Method in class com.cloudera.crunch.impl.mr.collect.InputCollection
 
hashCode() - Method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
hashCode() - Method in class com.cloudera.crunch.io.hbase.HBaseSourceTarget
 
hashCode() - Method in class com.cloudera.crunch.io.hbase.HBaseTarget
 
hashCode() - Method in class com.cloudera.crunch.io.impl.FileSourceImpl
 
hashCode() - Method in class com.cloudera.crunch.io.impl.FileTargetImpl
 
hashCode() - Method in class com.cloudera.crunch.io.impl.SourceTargetImpl
 
hashCode() - Method in class com.cloudera.crunch.io.seq.SeqFileTableSourceTarget
 
hashCode() - Method in class com.cloudera.crunch.Pair
 
hashCode() - Method in class com.cloudera.crunch.Tuple3
 
hashCode() - Method in class com.cloudera.crunch.Tuple4
 
hashCode() - Method in class com.cloudera.crunch.TupleN
 
hashCode() - Method in class com.cloudera.crunch.type.avro.AvroType
 
hashCode() - Method in class com.cloudera.crunch.type.DataBridge
 
hashCode() - Method in class com.cloudera.crunch.type.writable.GenericArrayWritable
 
hashCode() - Method in class com.cloudera.crunch.type.writable.TupleWritable
 
hashCode() - Method in class com.cloudera.crunch.type.writable.WritableType
 
HBaseSourceTarget - Class in com.cloudera.crunch.io.hbase
 
HBaseSourceTarget(String, Scan) - Constructor for class com.cloudera.crunch.io.hbase.HBaseSourceTarget
 
hbaseTable(String) - Static method in class com.cloudera.crunch.io.At
 
hbaseTable(String, Scan) - Static method in class com.cloudera.crunch.io.At
 
hbaseTable(String) - Static method in class com.cloudera.crunch.io.From
 
hbaseTable(String, Scan) - Static method in class com.cloudera.crunch.io.From
 
hbaseTable(String) - Static method in class com.cloudera.crunch.io.To
 
HBaseTarget - Class in com.cloudera.crunch.io.hbase
 
HBaseTarget(String) - Constructor for class com.cloudera.crunch.io.hbase.HBaseTarget
 

I

IdentityFn<T> - Class in com.cloudera.crunch.fn
 
initialize() - Method in class com.cloudera.crunch.DoFn
Called during the setup of the MapReduce job this DoFn is associated with.
initialize() - Method in class com.cloudera.crunch.fn.CompositeMapFn
 
initialize() - Method in class com.cloudera.crunch.fn.PairMapFn
 
initialize(CrunchTaskContext) - Method in class com.cloudera.crunch.impl.mr.run.RTNode
 
initialize() - Method in class com.cloudera.crunch.lib.Aggregate.TopKFn
 
initialize() - Method in class com.cloudera.crunch.lib.Sample.SamplerFn
 
initialize(InputSplit, TaskAttemptContext) - Method in class com.cloudera.crunch.type.avro.AvroRecordReader
 
initialize() - Method in class com.cloudera.crunch.type.PGroupedTableType.PairIterableMapFn
 
initialize() - Method in class com.cloudera.crunch.type.TupleFactory
 
initialize() - Method in class com.cloudera.crunch.util.PTypes.JacksonInputMapFn
 
initialize() - Method in class com.cloudera.crunch.util.PTypes.JacksonOutputMapFn
 
initialize() - Method in class com.cloudera.crunch.util.PTypes.ProtoInputMapFn
 
initialize() - Method in class com.cloudera.crunch.util.PTypes.SmileInputMapFn
 
initialize() - Method in class com.cloudera.crunch.util.PTypes.SmileOutputMapFn
 
initialize() - Method in class com.cloudera.crunch.util.PTypes.ThriftInputMapFn
 
initialize() - Method in class com.cloudera.crunch.util.PTypes.ThriftOutputMapFn
 
innerJoin(PTable<K, U>, PTable<K, V>) - Static method in class com.cloudera.crunch.lib.Join
 
InputCollection<S> - Class in com.cloudera.crunch.impl.mr.collect
 
InputCollection(Source<S>, MRPipeline) - Constructor for class com.cloudera.crunch.impl.mr.collect.InputCollection
 
inputFormatClass - Variable in class com.cloudera.crunch.io.impl.FileSourceImpl
 
InputTable<K,V> - Class in com.cloudera.crunch.impl.mr.collect
 
InputTable(TableSource<K, V>, MRPipeline) - Constructor for class com.cloudera.crunch.impl.mr.collect.InputTable
 
IntermediateEmitter - Class in com.cloudera.crunch.impl.mr.emit
An Emitter implementation that links the output of one DoFn to the input of another DoFn.
IntermediateEmitter(List<RTNode>) - Constructor for class com.cloudera.crunch.impl.mr.emit.IntermediateEmitter
 
intersection(PCollection<T>, PCollection<T>) - Static method in class com.cloudera.crunch.lib.Set
Compute the intersection of two sets of elements.
ints() - Static method in class com.cloudera.crunch.type.avro.Avros
 
ints() - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
ints() - Method in interface com.cloudera.crunch.type.PTypeFamily
 
ints() - Static method in class com.cloudera.crunch.type.writable.Writables
 
ints() - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
isCompatibleWith(GroupingOptions) - Method in class com.cloudera.crunch.GroupingOptions
 
isCompleted() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 
isDebugRun() - Method in class com.cloudera.crunch.impl.mr.run.CrunchTaskContext
 
isInputNode() - Method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
isLeafNode() - Method in class com.cloudera.crunch.impl.mr.run.RTNode
 
isMapOnlyJob() - Method in class com.cloudera.crunch.impl.mr.plan.MSCROutputHandler
 
isOutputNode() - Method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
isReady() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 
isSpecific() - Method in class com.cloudera.crunch.type.avro.AvroType
Determine if the wrapped type is a specific or generic Avro type.
isSplitable(JobContext, Path) - Method in class com.cloudera.crunch.io.text.BZip2TextInputFormat
 
isSplitable(FileSystem, Path) - Method in class com.cloudera.crunch.type.avro.AvroUtf8InputFormat
 
iterator() - Method in class com.cloudera.crunch.io.CompositePathIterable
 
iterator() - Method in class com.cloudera.crunch.materialize.MaterializableIterable
 
iterator() - Method in class com.cloudera.crunch.type.PGroupedTableType.PTypeIterable
 
iterator() - Method in class com.cloudera.crunch.util.Tuples.PairIterable
 
iterator() - Method in class com.cloudera.crunch.util.Tuples.QuadIterable
 
iterator() - Method in class com.cloudera.crunch.util.Tuples.TripIterable
 
iterator() - Method in class com.cloudera.crunch.util.Tuples.TupleNIterable
 

J

job - Variable in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 
JobControl - Class in org.apache.hadoop.mapreduce.lib.jobcontrol
This class encapsulates a set of MapReduce jobs and their dependencies.
JobControl(String) - Constructor for class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl
Construct a job control for a group of jobs.
JobControl.ThreadState - Enum in org.apache.hadoop.mapreduce.lib.jobcontrol
 
JobNameBuilder - Class in com.cloudera.crunch.impl.mr.plan
Visitor that traverses the DoNode instances in a job and builds a String that identifies the stages of the pipeline that belong to this job.
JobNameBuilder() - Constructor for class com.cloudera.crunch.impl.mr.plan.JobNameBuilder
 
JobPrototype - Class in com.cloudera.crunch.impl.mr.plan
 
join(PTable<K, U>) - Method in class com.cloudera.crunch.impl.mem.collect.MemTable
 
join(PTable<K, U>) - Method in class com.cloudera.crunch.impl.mr.collect.PTableBase
 
Join - Class in com.cloudera.crunch.lib
Utilities for joining multiple PTable instances based on a common key.
Join() - Constructor for class com.cloudera.crunch.lib.Join
 
join(PTable<K, U>, PTable<K, V>) - Static method in class com.cloudera.crunch.lib.Join
 
join(PTable<K, U>) - Method in interface com.cloudera.crunch.PTable
Perform an inner join on this table and the one passed in as an argument on their common keys.
JoinUtils - Class in com.cloudera.crunch.lib
Utilities that are useful in joining multiple data sets via a MapReduce job.
JoinUtils() - Constructor for class com.cloudera.crunch.lib.JoinUtils
 
JoinUtils.AvroIndexedRecordPartitioner - Class in com.cloudera.crunch.lib
 
JoinUtils.AvroIndexedRecordPartitioner() - Constructor for class com.cloudera.crunch.lib.JoinUtils.AvroIndexedRecordPartitioner
 
JoinUtils.AvroPairGroupingComparator<T> - Class in com.cloudera.crunch.lib
 
JoinUtils.AvroPairGroupingComparator() - Constructor for class com.cloudera.crunch.lib.JoinUtils.AvroPairGroupingComparator
 
JoinUtils.TupleWritableComparator - Class in com.cloudera.crunch.lib
 
JoinUtils.TupleWritableComparator() - Constructor for class com.cloudera.crunch.lib.JoinUtils.TupleWritableComparator
 
JoinUtils.TupleWritablePartitioner - Class in com.cloudera.crunch.lib
 
JoinUtils.TupleWritablePartitioner() - Constructor for class com.cloudera.crunch.lib.JoinUtils.TupleWritablePartitioner
 
jsons(Class<T>) - Static method in class com.cloudera.crunch.type.avro.Avros
 
jsons(Class<T>) - Static method in class com.cloudera.crunch.type.writable.Writables
 
jsonString(Class<T>, PTypeFamily) - Static method in class com.cloudera.crunch.util.PTypes
 

K

keys(PTable<K, V>) - Static method in class com.cloudera.crunch.lib.PTables
 
killJob() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 

L

LAST_N(int) - Static method in class com.cloudera.crunch.CombineFn
 
leftJoin(PTable<K, U>, PTable<K, V>) - Static method in class com.cloudera.crunch.lib.Join
 
listStatus(JobContext) - Method in class com.cloudera.crunch.type.avro.AvroInputFormat
 
longs() - Static method in class com.cloudera.crunch.type.avro.Avros
 
longs() - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
longs() - Method in interface com.cloudera.crunch.type.PTypeFamily
 
longs() - Static method in class com.cloudera.crunch.type.writable.Writables
 
longs() - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 

M

makeTuple(Object...) - Method in class com.cloudera.crunch.type.TupleFactory
 
map(R) - Method in class com.cloudera.crunch.fn.CompositeMapFn
 
map(T) - Method in class com.cloudera.crunch.fn.IdentityFn
 
map(K1) - Method in class com.cloudera.crunch.fn.MapKeysFn
 
map(V1) - Method in class com.cloudera.crunch.fn.MapValuesFn
 
map(Pair<K, V>) - Method in class com.cloudera.crunch.fn.PairMapFn
 
map(Object, Object, Mapper<Object, Object, Object, Object>.Context) - Method in class com.cloudera.crunch.impl.mr.run.CrunchMapper
 
map(S) - Method in class com.cloudera.crunch.MapFn
Maps the given input into an instance of the output type.
map(Pair<Object, Iterable<Object>>) - Method in class com.cloudera.crunch.type.PGroupedTableType.PairIterableMapFn
 
map(String) - Method in class com.cloudera.crunch.util.PTypes.JacksonInputMapFn
 
map(T) - Method in class com.cloudera.crunch.util.PTypes.JacksonOutputMapFn
 
map(ByteBuffer) - Method in class com.cloudera.crunch.util.PTypes.ProtoInputMapFn
 
map(T) - Method in class com.cloudera.crunch.util.PTypes.ProtoOutputMapFn
 
map(ByteBuffer) - Method in class com.cloudera.crunch.util.PTypes.SmileInputMapFn
 
map(T) - Method in class com.cloudera.crunch.util.PTypes.SmileOutputMapFn
 
map(ByteBuffer) - Method in class com.cloudera.crunch.util.PTypes.ThriftInputMapFn
 
map(T) - Method in class com.cloudera.crunch.util.PTypes.ThriftOutputMapFn
 
MapFn<S,T> - Class in com.cloudera.crunch
A DoFn for the common case of emitting exactly one value for each input record.
MapFn() - Constructor for class com.cloudera.crunch.MapFn
 
MapKeysFn<K1,K2,V> - Class in com.cloudera.crunch.fn
 
MapKeysFn() - Constructor for class com.cloudera.crunch.fn.MapKeysFn
 
MapReduceTarget - Interface in com.cloudera.crunch.io
 
maps(PType<T>) - Static method in class com.cloudera.crunch.type.avro.Avros
 
maps(PType<T>) - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
maps(PType<T>) - Method in interface com.cloudera.crunch.type.PTypeFamily
 
maps(PType<T>) - Static method in class com.cloudera.crunch.type.writable.Writables
 
maps(PType<T>) - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
MapValuesFn<K,V1,V2> - Class in com.cloudera.crunch.fn
 
MapValuesFn() - Constructor for class com.cloudera.crunch.fn.MapValuesFn
 
markLogged() - Method in exception com.cloudera.crunch.impl.mr.run.CrunchRuntimeException
 
MaterializableIterable<E> - Class in com.cloudera.crunch.materialize
 
MaterializableIterable(Pipeline, ReadableSourceTarget<E>) - Constructor for class com.cloudera.crunch.materialize.MaterializableIterable
 
materialize() - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
materialize(PCollection<T>) - Method in class com.cloudera.crunch.impl.mem.MemPipeline
 
materialize() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
materialize(PCollection<T>) - Method in class com.cloudera.crunch.impl.mr.MRPipeline
 
materialize() - Method in class com.cloudera.crunch.materialize.MaterializableIterable
 
materialize() - Method in interface com.cloudera.crunch.PCollection
Returns a reference to the data set represented by this PCollection that may be used by the client to read the data locally.
materialize(PCollection<T>) - Method in interface com.cloudera.crunch.Pipeline
Create the given PCollection and read the data it contains into the returned Collection instance for client use.
materializeAt(SourceTarget<S>) - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
max() - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
max() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
max(PCollection<S>) - Static method in class com.cloudera.crunch.lib.Aggregate
Returns the largest numerical element from the input collection.
max() - Method in interface com.cloudera.crunch.PCollection
Returns a PCollection made up of only the maximum element of this instance.
MAX_BIGINTS - Static variable in class com.cloudera.crunch.CombineFn
 
MAX_BIGINTS() - Static method in class com.cloudera.crunch.CombineFn
 
MAX_BIGINTS(int) - Static method in class com.cloudera.crunch.CombineFn
 
MAX_DOUBLES - Static variable in class com.cloudera.crunch.CombineFn
 
MAX_DOUBLES() - Static method in class com.cloudera.crunch.CombineFn
 
MAX_DOUBLES(int) - Static method in class com.cloudera.crunch.CombineFn
 
MAX_FLOATS - Static variable in class com.cloudera.crunch.CombineFn
 
MAX_FLOATS() - Static method in class com.cloudera.crunch.CombineFn
 
MAX_FLOATS(int) - Static method in class com.cloudera.crunch.CombineFn
 
MAX_INTS - Static variable in class com.cloudera.crunch.CombineFn
 
MAX_INTS() - Static method in class com.cloudera.crunch.CombineFn
 
MAX_INTS(int) - Static method in class com.cloudera.crunch.CombineFn
 
MAX_LONGS - Static variable in class com.cloudera.crunch.CombineFn
 
MAX_LONGS() - Static method in class com.cloudera.crunch.CombineFn
 
MAX_LONGS(int) - Static method in class com.cloudera.crunch.CombineFn
 
MemCollection<S> - Class in com.cloudera.crunch.impl.mem.collect
 
MemCollection(Iterable<S>) - Constructor for class com.cloudera.crunch.impl.mem.collect.MemCollection
 
MemCollection(Iterable<S>, PType<S>) - Constructor for class com.cloudera.crunch.impl.mem.collect.MemCollection
 
MemCollection(Iterable<S>, PType<S>, String) - Constructor for class com.cloudera.crunch.impl.mem.collect.MemCollection
 
MemPipeline - Class in com.cloudera.crunch.impl.mem
 
MemTable<K,V> - Class in com.cloudera.crunch.impl.mem.collect
 
MemTable(Iterable<Pair<K, V>>) - Constructor for class com.cloudera.crunch.impl.mem.collect.MemTable
 
MemTable(Iterable<Pair<K, V>>, PTableType<K, V>, String) - Constructor for class com.cloudera.crunch.impl.mem.collect.MemTable
 
message - Variable in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 
min() - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
min() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
min(PCollection<S>) - Static method in class com.cloudera.crunch.lib.Aggregate
Returns the smallest numerical element from the input collection.
min() - Method in interface com.cloudera.crunch.PCollection
Returns a PCollection made up of only the minimum element of this instance.
MIN_BIGINTS - Static variable in class com.cloudera.crunch.CombineFn
 
MIN_BIGINTS() - Static method in class com.cloudera.crunch.CombineFn
 
MIN_BIGINTS(int) - Static method in class com.cloudera.crunch.CombineFn
 
MIN_DOUBLES - Static variable in class com.cloudera.crunch.CombineFn
 
MIN_DOUBLES() - Static method in class com.cloudera.crunch.CombineFn
 
MIN_DOUBLES(int) - Static method in class com.cloudera.crunch.CombineFn
 
MIN_FLOATS - Static variable in class com.cloudera.crunch.CombineFn
 
MIN_FLOATS() - Static method in class com.cloudera.crunch.CombineFn
 
MIN_FLOATS(int) - Static method in class com.cloudera.crunch.CombineFn
 
MIN_INTS - Static variable in class com.cloudera.crunch.CombineFn
 
MIN_INTS() - Static method in class com.cloudera.crunch.CombineFn
 
MIN_INTS(int) - Static method in class com.cloudera.crunch.CombineFn
 
MIN_LONGS - Static variable in class com.cloudera.crunch.CombineFn
 
MIN_LONGS() - Static method in class com.cloudera.crunch.CombineFn
 
MIN_LONGS(int) - Static method in class com.cloudera.crunch.CombineFn
 
MRExecutor - Class in com.cloudera.crunch.impl.mr.exec
 
MRExecutor(Class<?>) - Constructor for class com.cloudera.crunch.impl.mr.exec.MRExecutor
 
MRPipeline - Class in com.cloudera.crunch.impl.mr
 
MRPipeline(Class<?>) - Constructor for class com.cloudera.crunch.impl.mr.MRPipeline
 
MRPipeline(Class<?>, Configuration) - Constructor for class com.cloudera.crunch.impl.mr.MRPipeline
 
MSCROutputHandler - Class in com.cloudera.crunch.impl.mr.plan
 
MSCROutputHandler(Job, Path, boolean) - Constructor for class com.cloudera.crunch.impl.mr.plan.MSCROutputHandler
 
MSCRPlanner - Class in com.cloudera.crunch.impl.mr.plan
 
MSCRPlanner(MRPipeline, Map<PCollectionImpl, Set<Target>>) - Constructor for class com.cloudera.crunch.impl.mr.plan.MSCRPlanner
 
MULTI_INPUTS - Static variable in class com.cloudera.crunch.impl.mr.run.RuntimeParameters
 
MULTI_OUTPUT_PREFIX - Static variable in class com.cloudera.crunch.impl.mr.plan.PlanningParameters
 
MultipleOutputEmitter<T,K,V> - Class in com.cloudera.crunch.impl.mr.emit
 
MultipleOutputEmitter(Converter, CrunchMultipleOutputs<K, V>, String) - Constructor for class com.cloudera.crunch.impl.mr.emit.MultipleOutputEmitter
 

N

newArrayList() - Static method in class com.cloudera.crunch.util.Collects
 
newArrayList(T...) - Static method in class com.cloudera.crunch.util.Collects
 
newArrayList(Iterable<? extends T>) - Static method in class com.cloudera.crunch.util.Collects
 
newArrayList(Iterator<? extends T>) - Static method in class com.cloudera.crunch.util.Collects
 
nextKeyValue() - Method in class com.cloudera.crunch.type.avro.AvroRecordReader
 
NodeContext - Enum in com.cloudera.crunch.impl.mr.run
Enum that is associated with a serialized DoNode instance, so we know how to use it within the context of a particular MR job.
not(FilterFn<S>) - Static method in class com.cloudera.crunch.FilterFn
 
nulls() - Static method in class com.cloudera.crunch.type.avro.Avros
 
nulls() - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
nulls() - Method in interface com.cloudera.crunch.type.PTypeFamily
 
nulls() - Static method in class com.cloudera.crunch.type.writable.Writables
 
nulls() - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
numReducers(int) - Method in class com.cloudera.crunch.GroupingOptions.Builder
 

O

of(T, U) - Static method in class com.cloudera.crunch.Pair
 
of(A, B, C) - Static method in class com.cloudera.crunch.Tuple3
 
of(A, B, C, D) - Static method in class com.cloudera.crunch.Tuple4
 
or(FilterFn<S>...) - Static method in class com.cloudera.crunch.FilterFn
 
org.apache.hadoop.mapreduce.lib.jobcontrol - package org.apache.hadoop.mapreduce.lib.jobcontrol
 
org.apache.hadoop.mapreduce.lib.output - package org.apache.hadoop.mapreduce.lib.output
 
OutputEmitter<T,K,V> - Class in com.cloudera.crunch.impl.mr.emit
 
OutputEmitter(Converter<K, V, Object, Object>, TaskInputOutputContext<?, ?, K, V>) - Constructor for class com.cloudera.crunch.impl.mr.emit.OutputEmitter
 
OutputHandler - Interface in com.cloudera.crunch.io
 
outputKey(K) - Method in class com.cloudera.crunch.type.avro.AvroKeyConverter
 
outputKey(Pair<K, V>) - Method in class com.cloudera.crunch.type.avro.AvroPairConverter
 
outputKey(S) - Method in interface com.cloudera.crunch.type.Converter
 
outputKey(Pair<K, V>) - Method in class com.cloudera.crunch.type.writable.WritablePairConverter
 
outputValue(K) - Method in class com.cloudera.crunch.type.avro.AvroKeyConverter
 
outputValue(Pair<K, V>) - Method in class com.cloudera.crunch.type.avro.AvroPairConverter
 
outputValue(S) - Method in interface com.cloudera.crunch.type.Converter
 
outputValue(Pair<K, V>) - Method in class com.cloudera.crunch.type.writable.WritablePairConverter
 

P

Pair<K,V> - Class in com.cloudera.crunch
A convenience class for two-element Tuples.
Pair(K, V) - Constructor for class com.cloudera.crunch.Pair
 
PAIR - Static variable in class com.cloudera.crunch.type.TupleFactory
 
pairAggregator(CombineFn.AggregatorFactory<V1>, CombineFn.AggregatorFactory<V2>) - Static method in class com.cloudera.crunch.CombineFn
 
PairMapFn<K,V,S,T> - Class in com.cloudera.crunch.fn
 
PairMapFn(MapFn<K, S>, MapFn<V, T>) - Constructor for class com.cloudera.crunch.fn.PairMapFn
 
pairs(PType<V1>, PType<V2>) - Static method in class com.cloudera.crunch.type.avro.Avros
 
pairs(PType<V1>, PType<V2>) - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
pairs(PType<V1>, PType<V2>) - Method in interface com.cloudera.crunch.type.PTypeFamily
 
pairs(PType<V1>, PType<V2>) - Static method in class com.cloudera.crunch.type.writable.Writables
 
pairs(PType<V1>, PType<V2>) - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
parallelDo(DoFn<S, T>, PType<T>) - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
parallelDo(String, DoFn<S, T>, PType<T>) - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
parallelDo(DoFn<S, Pair<K, V>>, PTableType<K, V>) - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
parallelDo(String, DoFn<S, Pair<K, V>>, PTableType<K, V>) - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
parallelDo(DoFn<S, T>, PType<T>) - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
parallelDo(String, DoFn<S, T>, PType<T>) - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
parallelDo(DoFn<S, Pair<K, V>>, PTableType<K, V>) - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
parallelDo(String, DoFn<S, Pair<K, V>>, PTableType<K, V>) - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
parallelDo(DoFn<S, T>, PType<T>) - Method in interface com.cloudera.crunch.PCollection
Applies the given doFn to the elements of this PCollection and returns a new PCollection that is the output of this processing.
parallelDo(String, DoFn<S, T>, PType<T>) - Method in interface com.cloudera.crunch.PCollection
Applies the given doFn to the elements of this PCollection and returns a new PCollection that is the output of this processing.
parallelDo(DoFn<S, Pair<K, V>>, PTableType<K, V>) - Method in interface com.cloudera.crunch.PCollection
Similar to the other parallelDo instance, but returns a PTable instance instead of a PCollection.
parallelDo(String, DoFn<S, Pair<K, V>>, PTableType<K, V>) - Method in interface com.cloudera.crunch.PCollection
Similar to the other parallelDo instance, but returns a PTable instance instead of a PCollection.
partitionerClass(Class<? extends Partitioner>) - Method in class com.cloudera.crunch.GroupingOptions.Builder
 
path - Variable in class com.cloudera.crunch.io.impl.FileSourceImpl
 
path - Variable in class com.cloudera.crunch.io.impl.FileTargetImpl
 
PathTarget - Interface in com.cloudera.crunch.io
 
PathTargetImpl - Class in com.cloudera.crunch.io
 
PathTargetImpl(String, Class<OutputFormat>, Class, Class) - Constructor for class com.cloudera.crunch.io.PathTargetImpl
 
PathTargetImpl(Path, Class<OutputFormat>, Class, Class) - Constructor for class com.cloudera.crunch.io.PathTargetImpl
 
PCollection<S> - Interface in com.cloudera.crunch
A representation of an immutable, distributed collection of elements that is the fundamental target of computations in Crunch.
PCollectionImpl<S> - Class in com.cloudera.crunch.impl.mr.collect
 
PCollectionImpl(String) - Constructor for class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
PCollectionImpl.Visitor - Interface in com.cloudera.crunch.impl.mr.collect
 
PGroupedTable<K,V> - Interface in com.cloudera.crunch
The Crunch representation of a grouped PTable.
PGroupedTableImpl<K,V> - Class in com.cloudera.crunch.impl.mr.collect
 
PGroupedTableType<K,V> - Class in com.cloudera.crunch.type
The PType instance for PGroupedTable instances.
PGroupedTableType(PTableType<K, V>) - Constructor for class com.cloudera.crunch.type.PGroupedTableType
 
PGroupedTableType.PairIterableMapFn<K,V> - Class in com.cloudera.crunch.type
 
PGroupedTableType.PairIterableMapFn(MapFn<Object, K>, MapFn<Object, V>) - Constructor for class com.cloudera.crunch.type.PGroupedTableType.PairIterableMapFn
 
PGroupedTableType.PTypeIterable<V> - Class in com.cloudera.crunch.type
 
PGroupedTableType.PTypeIterable(MapFn<Object, V>, Iterable<Object>) - Constructor for class com.cloudera.crunch.type.PGroupedTableType.PTypeIterable
 
pipeline - Variable in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
Pipeline - Interface in com.cloudera.crunch
Manages the state of a pipeline execution.
plan(Class<?>, Configuration) - Method in class com.cloudera.crunch.impl.mr.plan.MSCRPlanner
 
PlanningParameters - Class in com.cloudera.crunch.impl.mr.plan
 
process(Pair<K, Iterable<V>>, Emitter<Pair<K, V>>) - Method in class com.cloudera.crunch.CombineFn.AggregatorCombineFn
 
process(S, Emitter<T>) - Method in class com.cloudera.crunch.DoFn
Processes the records from a PCollection.
process(T, Emitter<T>) - Method in class com.cloudera.crunch.FilterFn
 
process(Pair<K1, V>, Emitter<Pair<K2, V>>) - Method in class com.cloudera.crunch.fn.MapKeysFn
 
process(Pair<K, V1>, Emitter<Pair<K, V2>>) - Method in class com.cloudera.crunch.fn.MapValuesFn
 
process(Object) - Method in class com.cloudera.crunch.impl.mr.run.RTNode
 
process(Object, Object) - Method in class com.cloudera.crunch.impl.mr.run.RTNode
 
process(Pair<Boolean, Iterable<Pair<K, V>>>, Emitter<Pair<Boolean, Pair<K, V>>>) - Method in class com.cloudera.crunch.lib.Aggregate.TopKCombineFn
 
process(Pair<K, V>, Emitter<Pair<Boolean, Pair<K, V>>>) - Method in class com.cloudera.crunch.lib.Aggregate.TopKFn
 
process(S, Emitter<S>) - Method in class com.cloudera.crunch.lib.Sample.SamplerFn
 
process(S, Emitter<T>) - Method in class com.cloudera.crunch.MapFn
 
processIterable(Object, Iterable) - Method in class com.cloudera.crunch.impl.mr.run.RTNode
 
progress() - Method in class com.cloudera.crunch.DoFn
 
protos(Class<T>, PTypeFamily) - Static method in class com.cloudera.crunch.util.PTypes
 
PTable<K,V> - Interface in com.cloudera.crunch
A sub-interface of PCollection that represents an immutable, distributed multi-map of keys and values.
PTableBase<K,V> - Class in com.cloudera.crunch.impl.mr.collect
 
PTableBase(String) - Constructor for class com.cloudera.crunch.impl.mr.collect.PTableBase
 
PTables - Class in com.cloudera.crunch.lib
Methods for performing common operations on PTables.
PTables() - Constructor for class com.cloudera.crunch.lib.PTables
 
PTableType<K,V> - Interface in com.cloudera.crunch.type
An extension of PType specifically for PTable objects.
ptype - Variable in class com.cloudera.crunch.io.impl.FileSourceImpl
 
PType<T> - Interface in com.cloudera.crunch.type
A PType defines a mapping between a data type that is used in a Crunch pipeline and a serialization and storage format that is used to read/write data from/to HDFS.
PTypeFamily - Interface in com.cloudera.crunch.type
An abstract factory for creating PType instances that have the same serialization/storage backing format.
PTypes - Class in com.cloudera.crunch.util
Utility functions for creating common types of derived PTypes, e.g., for JSON data, protocol buffers, and Thrift records.
PTypes() - Constructor for class com.cloudera.crunch.util.PTypes
 
PTypes.JacksonInputMapFn<T> - Class in com.cloudera.crunch.util
 
PTypes.JacksonInputMapFn(Class<T>) - Constructor for class com.cloudera.crunch.util.PTypes.JacksonInputMapFn
 
PTypes.JacksonOutputMapFn<T> - Class in com.cloudera.crunch.util
 
PTypes.JacksonOutputMapFn() - Constructor for class com.cloudera.crunch.util.PTypes.JacksonOutputMapFn
 
PTypes.ProtoInputMapFn<T extends com.google.protobuf.Message> - Class in com.cloudera.crunch.util
 
PTypes.ProtoInputMapFn(Class<T>) - Constructor for class com.cloudera.crunch.util.PTypes.ProtoInputMapFn
 
PTypes.ProtoOutputMapFn<T extends com.google.protobuf.Message> - Class in com.cloudera.crunch.util
 
PTypes.ProtoOutputMapFn() - Constructor for class com.cloudera.crunch.util.PTypes.ProtoOutputMapFn
 
PTypes.SmileInputMapFn<T> - Class in com.cloudera.crunch.util
 
PTypes.SmileInputMapFn(Class<T>) - Constructor for class com.cloudera.crunch.util.PTypes.SmileInputMapFn
 
PTypes.SmileOutputMapFn<T> - Class in com.cloudera.crunch.util
 
PTypes.SmileOutputMapFn() - Constructor for class com.cloudera.crunch.util.PTypes.SmileOutputMapFn
 
PTypes.ThriftInputMapFn<T extends org.apache.thrift.TBase> - Class in com.cloudera.crunch.util
 
PTypes.ThriftInputMapFn(Class<T>) - Constructor for class com.cloudera.crunch.util.PTypes.ThriftInputMapFn
 
PTypes.ThriftOutputMapFn<T extends org.apache.thrift.TBase> - Class in com.cloudera.crunch.util
 
PTypes.ThriftOutputMapFn() - Constructor for class com.cloudera.crunch.util.PTypes.ThriftOutputMapFn
 
PTypeUtils - Class in com.cloudera.crunch.type
Utilities for converting between PTypes from different PTypeFamily implementations.
put(Text, T) - Method in class com.cloudera.crunch.type.writable.TextMapWritable
 

Q

quadAggregator(CombineFn.AggregatorFactory<A>, CombineFn.AggregatorFactory<B>, CombineFn.AggregatorFactory<C>, CombineFn.AggregatorFactory<D>) - Static method in class com.cloudera.crunch.CombineFn
 
quads(PType<V1>, PType<V2>, PType<V3>, PType<V4>) - Static method in class com.cloudera.crunch.type.avro.Avros
 
quads(PType<V1>, PType<V2>, PType<V3>, PType<V4>) - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
quads(PType<V1>, PType<V2>, PType<V3>, PType<V4>) - Method in interface com.cloudera.crunch.type.PTypeFamily
 
quads(PType<V1>, PType<V2>, PType<V3>, PType<V4>) - Static method in class com.cloudera.crunch.type.writable.Writables
 
quads(PType<V1>, PType<V2>, PType<V3>, PType<V4>) - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 

R

read(Source<T>) - Method in class com.cloudera.crunch.impl.mem.MemPipeline
 
read(TableSource<K, V>) - Method in class com.cloudera.crunch.impl.mem.MemPipeline
 
read(Source<S>) - Method in class com.cloudera.crunch.impl.mr.MRPipeline
 
read(TableSource<K, V>) - Method in class com.cloudera.crunch.impl.mr.MRPipeline
 
read(FileSystem, Path) - Method in class com.cloudera.crunch.io.avro.AvroFileReaderFactory
 
read(Configuration) - Method in class com.cloudera.crunch.io.avro.AvroFileSource
 
read(FileSystem, Path) - Method in interface com.cloudera.crunch.io.FileReaderFactory
 
read(Configuration) - Method in class com.cloudera.crunch.io.impl.ReadableSourcePathTargetImpl
 
read(Configuration) - Method in class com.cloudera.crunch.io.impl.ReadableSourceTargetImpl
 
read(Configuration) - Method in interface com.cloudera.crunch.io.ReadableSource
 
read(FileSystem, Path) - Method in class com.cloudera.crunch.io.seq.SeqFileReaderFactory
 
read(Configuration) - Method in class com.cloudera.crunch.io.seq.SeqFileSource
 
read(FileSystem, Path) - Method in class com.cloudera.crunch.io.seq.SeqFileTableReaderFactory
 
read(Configuration) - Method in class com.cloudera.crunch.io.seq.SeqFileTableSourceTarget
 
read() - Method in class com.cloudera.crunch.io.text.CBZip2InputStream
 
read(FileSystem, Path) - Method in class com.cloudera.crunch.io.text.TextFileReaderFactory
 
read(Configuration) - Method in class com.cloudera.crunch.io.text.TextFileSource
 
read(Source<T>) - Method in interface com.cloudera.crunch.Pipeline
Converts the given Source into a PCollection that is available to jobs run using this Pipeline instance.
read(TableSource<K, V>) - Method in interface com.cloudera.crunch.Pipeline
A version of the read method for TableSource instances that map to PTables.
read(Source<T>) - Method in class com.cloudera.crunch.tool.CrunchTool
 
read(TableSource<K, V>) - Method in class com.cloudera.crunch.tool.CrunchTool
 
read(Configuration, Path) - Static method in class com.cloudera.crunch.util.DistCache
 
ReadableSource<T> - Interface in com.cloudera.crunch.io
 
ReadableSourcePathTargetImpl<T> - Class in com.cloudera.crunch.io.impl
 
ReadableSourcePathTargetImpl(ReadableSource<T>, PathTarget) - Constructor for class com.cloudera.crunch.io.impl.ReadableSourcePathTargetImpl
 
ReadableSourceTarget<T> - Interface in com.cloudera.crunch.io
An interface that indicates that a SourceTarget instance can be read into the local client.
ReadableSourceTargetImpl<T> - Class in com.cloudera.crunch.io.impl
 
ReadableSourceTargetImpl(ReadableSource<T>, Target) - Constructor for class com.cloudera.crunch.io.impl.ReadableSourceTargetImpl
 
readFields(DataInput) - Method in class com.cloudera.crunch.impl.mr.run.CrunchInputSplit
 
readFields(DataInput) - Method in class com.cloudera.crunch.type.writable.GenericArrayWritable
 
readFields(DataInput) - Method in class com.cloudera.crunch.type.writable.TextMapWritable
 
readFields(DataInput) - Method in class com.cloudera.crunch.type.writable.TupleWritable
readTextFile(String) - Method in class com.cloudera.crunch.impl.mem.MemPipeline
 
readTextFile(String) - Method in class com.cloudera.crunch.impl.mr.MRPipeline
 
readTextFile(String) - Method in interface com.cloudera.crunch.Pipeline
A convenience method for reading a text file.
readTextFile(String) - Method in class com.cloudera.crunch.tool.CrunchTool
 
records(Class<T>) - Static method in class com.cloudera.crunch.type.avro.Avros
 
records(Class<T>) - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
records(Class<T>) - Method in interface com.cloudera.crunch.type.PTypeFamily
 
records(Class<T>) - Static method in class com.cloudera.crunch.type.writable.Writables
 
records(Class<T>) - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
reduce(Object, Iterable<Object>, Reducer<Object, Object, Object, Object>.Context) - Method in class com.cloudera.crunch.impl.mr.run.CrunchReducer
 
REFLECT_DATA_FACTORY - Static variable in class com.cloudera.crunch.type.avro.Avros
The instance we use for generating reflected schemas.
ReflectDataFactory - Class in com.cloudera.crunch.type.avro
A Factory class for constructing Avro reflection-related objects.
ReflectDataFactory() - Constructor for class com.cloudera.crunch.type.avro.ReflectDataFactory
 
reflects(Class<T>) - Static method in class com.cloudera.crunch.type.avro.Avros
 
register(Class<T>, AvroType<T>) - Static method in class com.cloudera.crunch.type.avro.Avros
 
register(Class<T>, WritableType<T, ?>) - Static method in class com.cloudera.crunch.type.writable.Writables
 
reset() - Method in interface com.cloudera.crunch.CombineFn.Aggregator
Clears the internal state of this Aggregator and prepares it for the values associated with the next key.
reset() - Method in class com.cloudera.crunch.CombineFn.FirstNAggregator
 
reset() - Method in class com.cloudera.crunch.CombineFn.LastNAggregator
 
reset() - Method in class com.cloudera.crunch.CombineFn.MaxBigInts
 
reset() - Method in class com.cloudera.crunch.CombineFn.MaxDoubles
 
reset() - Method in class com.cloudera.crunch.CombineFn.MaxFloats
 
reset() - Method in class com.cloudera.crunch.CombineFn.MaxInts
 
reset() - Method in class com.cloudera.crunch.CombineFn.MaxLongs
 
reset() - Method in class com.cloudera.crunch.CombineFn.MaxNAggregator
 
reset() - Method in class com.cloudera.crunch.CombineFn.MinBigInts
 
reset() - Method in class com.cloudera.crunch.CombineFn.MinDoubles
 
reset() - Method in class com.cloudera.crunch.CombineFn.MinFloats
 
reset() - Method in class com.cloudera.crunch.CombineFn.MinInts
 
reset() - Method in class com.cloudera.crunch.CombineFn.MinLongs
 
reset() - Method in class com.cloudera.crunch.CombineFn.MinNAggregator
 
reset() - Method in class com.cloudera.crunch.CombineFn.SumBigInts
 
reset() - Method in class com.cloudera.crunch.CombineFn.SumDoubles
 
reset() - Method in class com.cloudera.crunch.CombineFn.SumFloats
 
reset() - Method in class com.cloudera.crunch.CombineFn.SumInts
 
reset() - Method in class com.cloudera.crunch.CombineFn.SumLongs
 
results() - Method in interface com.cloudera.crunch.CombineFn.Aggregator
Returns the current aggregated state of this instance.
results() - Method in class com.cloudera.crunch.CombineFn.FirstNAggregator
 
results() - Method in class com.cloudera.crunch.CombineFn.LastNAggregator
 
results() - Method in class com.cloudera.crunch.CombineFn.MaxBigInts
 
results() - Method in class com.cloudera.crunch.CombineFn.MaxDoubles
 
results() - Method in class com.cloudera.crunch.CombineFn.MaxFloats
 
results() - Method in class com.cloudera.crunch.CombineFn.MaxInts
 
results() - Method in class com.cloudera.crunch.CombineFn.MaxLongs
 
results() - Method in class com.cloudera.crunch.CombineFn.MaxNAggregator
 
results() - Method in class com.cloudera.crunch.CombineFn.MinBigInts
 
results() - Method in class com.cloudera.crunch.CombineFn.MinDoubles
 
results() - Method in class com.cloudera.crunch.CombineFn.MinFloats
 
results() - Method in class com.cloudera.crunch.CombineFn.MinInts
 
results() - Method in class com.cloudera.crunch.CombineFn.MinLongs
 
results() - Method in class com.cloudera.crunch.CombineFn.MinNAggregator
 
results() - Method in class com.cloudera.crunch.CombineFn.PairAggregator
 
results() - Method in class com.cloudera.crunch.CombineFn.QuadAggregator
 
results() - Method in class com.cloudera.crunch.CombineFn.SumBigInts
 
results() - Method in class com.cloudera.crunch.CombineFn.SumDoubles
 
results() - Method in class com.cloudera.crunch.CombineFn.SumFloats
 
results() - Method in class com.cloudera.crunch.CombineFn.SumInts
 
results() - Method in class com.cloudera.crunch.CombineFn.SumLongs
 
results() - Method in class com.cloudera.crunch.CombineFn.TripAggregator
 
results() - Method in class com.cloudera.crunch.CombineFn.TupleNAggregator
 
resume() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl
Resume the suspended thread.
RTNode - Class in com.cloudera.crunch.impl.mr.run
 
RTNode(DoFn<Object, Object>, String, List<RTNode>, Converter, Converter, String) - Constructor for class com.cloudera.crunch.impl.mr.run.RTNode
 
run() - Method in class com.cloudera.crunch.impl.mem.MemPipeline
 
run() - Method in class com.cloudera.crunch.impl.mr.MRPipeline
 
run() - Method in interface com.cloudera.crunch.Pipeline
Constructs and executes a series of MapReduce jobs in order to write data to the output targets.
run() - Method in class com.cloudera.crunch.tool.CrunchTool
 
run() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl
The main loop for the thread.
RuntimeParameters - Class in com.cloudera.crunch.impl.mr.run
Parameters used during the runtime execution.

S

SafeAvroSerialization<T> - Class in com.cloudera.crunch.type.avro
The Serialization used by jobs configured with AvroJob.
SafeAvroSerialization() - Constructor for class com.cloudera.crunch.type.avro.SafeAvroSerialization
 
sample(double) - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
sample(double, long) - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
sample(double) - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
sample(double, long) - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
Sample - Class in com.cloudera.crunch.lib
 
Sample() - Constructor for class com.cloudera.crunch.lib.Sample
 
sample(PCollection<S>, double) - Static method in class com.cloudera.crunch.lib.Sample
 
sample(PCollection<S>, long, double) - Static method in class com.cloudera.crunch.lib.Sample
 
sample(double) - Method in interface com.cloudera.crunch.PCollection
Randomly sample items from this PCollection instance with the given probability of an item being accepted.
sample(double, long) - Method in interface com.cloudera.crunch.PCollection
Randomly sample items from this PCollection instance with the given probability of an item being accepted and using the given seed.
Sample.SamplerFn<S> - Class in com.cloudera.crunch.lib
 
Sample.SamplerFn(long, double) - Constructor for class com.cloudera.crunch.lib.Sample.SamplerFn
 
scaleFactor() - Method in class com.cloudera.crunch.DoFn
Returns an estimate of how applying this function to a PCollection will cause it to change in size.
scaleFactor() - Method in class com.cloudera.crunch.FilterFn.AndFn
 
scaleFactor() - Method in class com.cloudera.crunch.FilterFn.NotFn
 
scaleFactor() - Method in class com.cloudera.crunch.FilterFn.OrFn
 
scaleFactor() - Method in class com.cloudera.crunch.FilterFn
 
scaleFactor() - Method in class com.cloudera.crunch.MapFn
 
scan - Variable in class com.cloudera.crunch.io.hbase.HBaseSourceTarget
 
second() - Method in class com.cloudera.crunch.Pair
 
second() - Method in class com.cloudera.crunch.Tuple3
 
second() - Method in class com.cloudera.crunch.Tuple4
 
SeqFileHelper - Class in com.cloudera.crunch.io.seq
 
SeqFileHelper() - Constructor for class com.cloudera.crunch.io.seq.SeqFileHelper
 
SeqFileReaderFactory<T> - Class in com.cloudera.crunch.io.seq
 
SeqFileReaderFactory(PType<T>, Configuration) - Constructor for class com.cloudera.crunch.io.seq.SeqFileReaderFactory
 
SeqFileSource<T> - Class in com.cloudera.crunch.io.seq
 
SeqFileSource(Path, PType<T>) - Constructor for class com.cloudera.crunch.io.seq.SeqFileSource
 
SeqFileSourceTarget<T> - Class in com.cloudera.crunch.io.seq
 
SeqFileSourceTarget(String, PType<T>) - Constructor for class com.cloudera.crunch.io.seq.SeqFileSourceTarget
 
SeqFileSourceTarget(Path, PType<T>) - Constructor for class com.cloudera.crunch.io.seq.SeqFileSourceTarget
 
SeqFileTableReaderFactory<K,V> - Class in com.cloudera.crunch.io.seq
 
SeqFileTableReaderFactory(PTableType<K, V>, Configuration) - Constructor for class com.cloudera.crunch.io.seq.SeqFileTableReaderFactory
 
SeqFileTableSourceTarget<K,V> - Class in com.cloudera.crunch.io.seq
 
SeqFileTableSourceTarget(String, PTableType<K, V>) - Constructor for class com.cloudera.crunch.io.seq.SeqFileTableSourceTarget
 
SeqFileTableSourceTarget(Path, PTableType<K, V>) - Constructor for class com.cloudera.crunch.io.seq.SeqFileTableSourceTarget
 
SeqFileTarget - Class in com.cloudera.crunch.io.seq
 
SeqFileTarget(String) - Constructor for class com.cloudera.crunch.io.seq.SeqFileTarget
 
SeqFileTarget(Path) - Constructor for class com.cloudera.crunch.io.seq.SeqFileTarget
 
sequenceFile(String, PType<T>) - Static method in class com.cloudera.crunch.io.At
 
sequenceFile(Path, PType<T>) - Static method in class com.cloudera.crunch.io.At
 
sequenceFile(String, PType<K>, PType<V>) - Static method in class com.cloudera.crunch.io.At
 
sequenceFile(Path, PType<K>, PType<V>) - Static method in class com.cloudera.crunch.io.At
 
sequenceFile(String, PType<T>) - Static method in class com.cloudera.crunch.io.From
 
sequenceFile(Path, PType<T>) - Static method in class com.cloudera.crunch.io.From
 
sequenceFile(String, PType<K>, PType<V>) - Static method in class com.cloudera.crunch.io.From
 
sequenceFile(Path, PType<K>, PType<V>) - Static method in class com.cloudera.crunch.io.From
 
sequenceFile(String) - Static method in class com.cloudera.crunch.io.To
 
sequenceFile(Path) - Static method in class com.cloudera.crunch.io.To
 
Set - Class in com.cloudera.crunch.lib
Utilities for performing set operations (difference, intersection, etc) on PCollection instances.
Set() - Constructor for class com.cloudera.crunch.lib.Set
 
set(Writable[]) - Method in class com.cloudera.crunch.type.writable.GenericArrayWritable
 
setConf(Configuration) - Method in class com.cloudera.crunch.impl.mr.run.CrunchInputSplit
 
setConf(Configuration) - Method in class com.cloudera.crunch.lib.JoinUtils.AvroPairGroupingComparator
 
setConf(Configuration) - Method in class com.cloudera.crunch.tool.CrunchTool
 
setConfiguration(Configuration) - Method in class com.cloudera.crunch.impl.mem.MemPipeline
 
setConfiguration(Configuration) - Method in class com.cloudera.crunch.impl.mr.MRPipeline
 
setConfiguration(Configuration) - Method in interface com.cloudera.crunch.Pipeline
Set the Configuration to use with this pipeline.
setConfigurationForTest(Configuration) - Method in class com.cloudera.crunch.DoFn
Sets a Configuration instance to be used during unit tests.
setContext(TaskInputOutputContext<?, ?, ?, ?>) - Method in class com.cloudera.crunch.DoFn
Called during setup to pass the TaskInputOutputContext to this DoFn instance.
setCountersEnabled(Job, boolean) - Static method in class org.apache.hadoop.mapreduce.lib.output.CrunchMultipleOutputs
Enables or disables counters for the named outputs.
setJob(Job) - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
Set the MapReduce job.
setJobID(String) - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
Set the job ID for this job.
setJobName(String) - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
Set the job name for this job.
setJobState(ControlledJob.State) - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
Set the state for this job.
setMessage(String) - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
Set the message for this job.
setOutputName(String) - Method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
setReadLimit(long) - Method in class com.cloudera.crunch.io.text.CBZip2InputStream
 
setStatus(String) - Method in class com.cloudera.crunch.DoFn
 
setup(Mapper<Object, Object, Object, Object>.Context) - Method in class com.cloudera.crunch.impl.mr.run.CrunchMapper
 
setup(Reducer<Object, Object, Object, Object>.Context) - Method in class com.cloudera.crunch.impl.mr.run.CrunchReducer
 
setValueType(String) - Method in class com.cloudera.crunch.type.writable.GenericArrayWritable
 
setWritten(int) - Method in class com.cloudera.crunch.type.writable.TupleWritable
Record that the tuple contains an element at the position provided.
size() - Method in class com.cloudera.crunch.Pair
 
size() - Method in interface com.cloudera.crunch.Tuple
Returns the number of elements in this Tuple.
size() - Method in class com.cloudera.crunch.Tuple3
 
size() - Method in class com.cloudera.crunch.Tuple4
 
size() - Method in class com.cloudera.crunch.TupleN
 
size() - Method in class com.cloudera.crunch.type.writable.TupleWritable
The number of children in this Tuple.
smile(Class<T>, PTypeFamily) - Static method in class com.cloudera.crunch.util.PTypes
 
sort(boolean) - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
sort(boolean) - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
Sort - Class in com.cloudera.crunch.lib
Utilities for sorting PCollection instances.
Sort() - Constructor for class com.cloudera.crunch.lib.Sort
 
sort(PCollection<T>) - Static method in class com.cloudera.crunch.lib.Sort
Sorts the PCollection using the natural ordering of its elements.
sort(PCollection<T>, Sort.Order) - Static method in class com.cloudera.crunch.lib.Sort
Sorts the PCollection using the natural ordering of its elements in the order specified.
sort(PTable<K, V>) - Static method in class com.cloudera.crunch.lib.Sort
Sorts the PTable using the natural ordering of its keys.
sort(PTable<K, V>, Sort.Order) - Static method in class com.cloudera.crunch.lib.Sort
Sorts the PTable using the natural ordering of its keys in the order specified.
sort(boolean) - Method in interface com.cloudera.crunch.PCollection
Returns a PCollection instance that contains all of the elements of this instance in sorted order.
Sort.ColumnOrder - Class in com.cloudera.crunch.lib
To sort by column 2 ascending then column 1 descending, you would use: sortPairs(coll, by(2, ASCENDING), by(1, DESCENDING)). Column numbering is 1-based.
Sort.ColumnOrder(int, Sort.Order) - Constructor for class com.cloudera.crunch.lib.Sort.ColumnOrder
 
Sort.Order - Enum in com.cloudera.crunch.lib
 
sortComparatorClass(Class<? extends RawComparator>) - Method in class com.cloudera.crunch.GroupingOptions.Builder
 
sortPairs(PCollection<Pair<U, V>>, Sort.ColumnOrder...) - Static method in class com.cloudera.crunch.lib.Sort
Sorts the PCollection of Pairs using the specified column ordering.
sortQuads(PCollection<Tuple4<V1, V2, V3, V4>>, Sort.ColumnOrder...) - Static method in class com.cloudera.crunch.lib.Sort
Sorts the PCollection of Tuple4s using the specified column ordering.
sortTriples(PCollection<Tuple3<V1, V2, V3>>, Sort.ColumnOrder...) - Static method in class com.cloudera.crunch.lib.Sort
Sorts the PCollection of Tuple3s using the specified column ordering.
sortTuples(PCollection<TupleN>, Sort.ColumnOrder...) - Static method in class com.cloudera.crunch.lib.Sort
Sorts the PCollection of TupleNs using the specified column ordering.
source - Variable in class com.cloudera.crunch.io.impl.SourceTargetImpl
 
Source<T> - Interface in com.cloudera.crunch
A Source represents an input data set that is an input to one or more MapReduce jobs.
SourcePathTargetImpl<T> - Class in com.cloudera.crunch.io.impl
 
SourcePathTargetImpl(Source<T>, PathTarget) - Constructor for class com.cloudera.crunch.io.impl.SourcePathTargetImpl
 
SourceTarget<T> - Interface in com.cloudera.crunch
An interface for classes that implement both the Source and the Target interfaces.
SourceTargetHelper - Class in com.cloudera.crunch.io
Functions for configuring the inputs/outputs of MapReduce jobs.
SourceTargetHelper() - Constructor for class com.cloudera.crunch.io.SourceTargetHelper
 
SourceTargetImpl<T> - Class in com.cloudera.crunch.io.impl
 
SourceTargetImpl(Source<T>, Target) - Constructor for class com.cloudera.crunch.io.impl.SourceTargetImpl
 
state - Variable in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 
stop() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl
Set the thread state to STOPPING so that the thread will stop when it wakes up.
STRING_TO_UTF8 - Static variable in class com.cloudera.crunch.type.avro.Avros
 
strings() - Static method in class com.cloudera.crunch.type.avro.Avros
 
strings() - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
strings() - Method in interface com.cloudera.crunch.type.PTypeFamily
 
strings() - Static method in class com.cloudera.crunch.type.writable.Writables
 
strings() - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
submit() - Method in class com.cloudera.crunch.impl.mr.exec.CrunchJob
 
submit() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
Submit this job to mapred.
SUM_BIGINTS - Static variable in class com.cloudera.crunch.CombineFn
 
SUM_BIGINTS() - Static method in class com.cloudera.crunch.CombineFn
 
SUM_DOUBLES - Static variable in class com.cloudera.crunch.CombineFn
 
SUM_DOUBLES() - Static method in class com.cloudera.crunch.CombineFn
 
SUM_FLOATS - Static variable in class com.cloudera.crunch.CombineFn
 
SUM_FLOATS() - Static method in class com.cloudera.crunch.CombineFn
 
SUM_INTS - Static variable in class com.cloudera.crunch.CombineFn
 
SUM_INTS() - Static method in class com.cloudera.crunch.CombineFn
 
SUM_LONGS - Static variable in class com.cloudera.crunch.CombineFn
 
SUM_LONGS() - Static method in class com.cloudera.crunch.CombineFn
 
suspend() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl
Suspend the running thread.

T

table - Variable in class com.cloudera.crunch.io.hbase.HBaseTarget
 
tableOf(S, T, Object...) - Static method in class com.cloudera.crunch.impl.mem.MemPipeline
 
tableOf(Iterable<Pair<S, T>>) - Static method in class com.cloudera.crunch.impl.mem.MemPipeline
 
tableOf(PType<K>, PType<V>) - Static method in class com.cloudera.crunch.type.avro.Avros
 
tableOf(PType<K>, PType<V>) - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
tableOf(PType<K>, PType<V>) - Method in interface com.cloudera.crunch.type.PTypeFamily
 
tableOf(PType<K>, PType<V>) - Static method in class com.cloudera.crunch.type.writable.Writables
 
tableOf(PType<K>, PType<V>) - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
TableSource<K,V> - Interface in com.cloudera.crunch
The interface for Source implementations that return a PTable.
TableSourcePathTargetImpl<K,V> - Class in com.cloudera.crunch.io.impl
 
TableSourcePathTargetImpl(TableSource<K, V>, PathTarget) - Constructor for class com.cloudera.crunch.io.impl.TableSourcePathTargetImpl
 
TableSourceTargetImpl<K,V> - Class in com.cloudera.crunch.io.impl
 
TableSourceTargetImpl(TableSource<K, V>, Target) - Constructor for class com.cloudera.crunch.io.impl.TableSourceTargetImpl
 
tableType - Variable in class com.cloudera.crunch.type.PGroupedTableType
 
target - Variable in class com.cloudera.crunch.io.impl.SourceTargetImpl
 
Target - Interface in com.cloudera.crunch
A Target represents the output destination of a Crunch job.
TestCounters - Class in com.cloudera.crunch.test
A utility class used during unit testing to update and read counters.
TestCounters() - Constructor for class com.cloudera.crunch.test.TestCounters
 
textFile(String) - Static method in class com.cloudera.crunch.io.At
 
textFile(Path) - Static method in class com.cloudera.crunch.io.At
 
textFile(String, PType<T>) - Static method in class com.cloudera.crunch.io.At
 
textFile(Path, PType<T>) - Static method in class com.cloudera.crunch.io.At
 
textFile(String) - Static method in class com.cloudera.crunch.io.From
 
textFile(Path) - Static method in class com.cloudera.crunch.io.From
 
textFile(String, PType<T>) - Static method in class com.cloudera.crunch.io.From
 
textFile(Path, PType<T>) - Static method in class com.cloudera.crunch.io.From
 
textFile(String) - Static method in class com.cloudera.crunch.io.To
 
textFile(Path) - Static method in class com.cloudera.crunch.io.To
 
TextFileReaderFactory<T> - Class in com.cloudera.crunch.io.text
 
TextFileReaderFactory(PType<T>) - Constructor for class com.cloudera.crunch.io.text.TextFileReaderFactory
 
TextFileSource<T> - Class in com.cloudera.crunch.io.text
 
TextFileSource(Path, PType<T>) - Constructor for class com.cloudera.crunch.io.text.TextFileSource
 
TextFileSourceTarget<T> - Class in com.cloudera.crunch.io.text
 
TextFileSourceTarget(String, PType<T>) - Constructor for class com.cloudera.crunch.io.text.TextFileSourceTarget
 
TextFileSourceTarget(Path, PType<T>) - Constructor for class com.cloudera.crunch.io.text.TextFileSourceTarget
 
TextFileTarget - Class in com.cloudera.crunch.io.text
 
TextFileTarget(String) - Constructor for class com.cloudera.crunch.io.text.TextFileTarget
 
TextFileTarget(Path) - Constructor for class com.cloudera.crunch.io.text.TextFileTarget
 
TextMapWritable<T extends org.apache.hadoop.io.Writable> - Class in com.cloudera.crunch.type.writable
 
TextMapWritable() - Constructor for class com.cloudera.crunch.type.writable.TextMapWritable
 
TextMapWritable(Class<T>) - Constructor for class com.cloudera.crunch.type.writable.TextMapWritable
 
third() - Method in class com.cloudera.crunch.Tuple3
 
third() - Method in class com.cloudera.crunch.Tuple4
 
thrifts(Class<T>, PTypeFamily) - Static method in class com.cloudera.crunch.util.PTypes
 
To - Class in com.cloudera.crunch.io
Static factory methods for creating various Target types.
To() - Constructor for class com.cloudera.crunch.io.To
 
to - Static variable in class com.cloudera.crunch.tool.CrunchTool
 
top(int) - Method in class com.cloudera.crunch.impl.mem.collect.MemTable
 
top(int) - Method in class com.cloudera.crunch.impl.mr.collect.PTableBase
 
top(PTable<K, V>, int, boolean) - Static method in class com.cloudera.crunch.lib.Aggregate
 
top(int) - Method in interface com.cloudera.crunch.PTable
Returns a PTable made up of the pairs in this PTable with the largest value field.
toRTNode(boolean, Configuration, NodeContext) - Method in class com.cloudera.crunch.impl.mr.plan.DoNode
 
toString() - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
toString() - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
toString() - Method in class com.cloudera.crunch.impl.mr.run.RTNode
 
toString() - Method in class com.cloudera.crunch.io.avro.AvroFileSource
 
toString() - Method in class com.cloudera.crunch.io.avro.AvroFileTarget
 
toString() - Method in class com.cloudera.crunch.io.impl.FileSourceImpl
 
toString() - Method in class com.cloudera.crunch.io.impl.FileTargetImpl
 
toString() - Method in class com.cloudera.crunch.io.impl.SourceTargetImpl
 
toString() - Method in class com.cloudera.crunch.io.seq.SeqFileSource
 
toString() - Method in class com.cloudera.crunch.io.seq.SeqFileTableSourceTarget
 
toString() - Method in class com.cloudera.crunch.io.seq.SeqFileTarget
 
toString() - Method in class com.cloudera.crunch.io.text.TextFileSourceTarget
 
toString() - Method in class com.cloudera.crunch.io.text.TextFileTarget
 
toString() - Method in class com.cloudera.crunch.lib.Sort.ColumnOrder
 
toString() - Method in class com.cloudera.crunch.Pair
 
toString() - Method in class com.cloudera.crunch.Tuple3
 
toString() - Method in class com.cloudera.crunch.Tuple4
 
toString() - Method in class com.cloudera.crunch.TupleN
 
toString() - Method in class com.cloudera.crunch.type.writable.GenericArrayWritable
 
toString() - Method in class com.cloudera.crunch.type.writable.TupleWritable
Convert Tuple to String as in the following.
toString() - Method in class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob
 
tripAggregator(CombineFn.AggregatorFactory<A>, CombineFn.AggregatorFactory<B>, CombineFn.AggregatorFactory<C>) - Static method in class com.cloudera.crunch.CombineFn
 
triples(PType<V1>, PType<V2>, PType<V3>) - Static method in class com.cloudera.crunch.type.avro.Avros
 
triples(PType<V1>, PType<V2>, PType<V3>) - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
triples(PType<V1>, PType<V2>, PType<V3>) - Method in interface com.cloudera.crunch.type.PTypeFamily
 
triples(PType<V1>, PType<V2>, PType<V3>) - Static method in class com.cloudera.crunch.type.writable.Writables
 
triples(PType<V1>, PType<V2>, PType<V3>) - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
Tuple - Interface in com.cloudera.crunch
A fixed-size collection of Objects, used in Crunch for representing joins between PCollections.
Tuple3<V1,V2,V3> - Class in com.cloudera.crunch
A convenience class for three-element Tuples.
Tuple3(V1, V2, V3) - Constructor for class com.cloudera.crunch.Tuple3
 
TUPLE3 - Static variable in class com.cloudera.crunch.type.TupleFactory
 
Tuple4<V1,V2,V3,V4> - Class in com.cloudera.crunch
A convenience class for four-element Tuples.
Tuple4(V1, V2, V3, V4) - Constructor for class com.cloudera.crunch.Tuple4
 
TUPLE4 - Static variable in class com.cloudera.crunch.type.TupleFactory
 
tupleAggregator(CombineFn.AggregatorFactory<?>...) - Static method in class com.cloudera.crunch.CombineFn
 
TupleFactory<T extends Tuple> - Class in com.cloudera.crunch.type
 
TupleFactory() - Constructor for class com.cloudera.crunch.type.TupleFactory
 
TupleN - Class in com.cloudera.crunch
A Tuple instance for an arbitrary number of values.
TupleN(Object...) - Constructor for class com.cloudera.crunch.TupleN
 
TUPLEN - Static variable in class com.cloudera.crunch.type.TupleFactory
 
tuples(PType...) - Static method in class com.cloudera.crunch.type.avro.Avros
 
tuples(Class<T>, PType...) - Static method in class com.cloudera.crunch.type.avro.Avros
 
tuples(PType...) - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
tuples(Class<T>, PType...) - Method in class com.cloudera.crunch.type.avro.AvroTypeFamily
 
tuples(PType...) - Method in interface com.cloudera.crunch.type.PTypeFamily
 
tuples(Class<T>, PType...) - Method in interface com.cloudera.crunch.type.PTypeFamily
 
tuples(PType...) - Static method in class com.cloudera.crunch.type.writable.Writables
 
tuples(Class<T>, PType...) - Static method in class com.cloudera.crunch.type.writable.Writables
 
tuples(PType...) - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
tuples(Class<T>, PType...) - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
Tuples - Class in com.cloudera.crunch.util
Utilities for working with subclasses of the Tuple interface.
Tuples() - Constructor for class com.cloudera.crunch.util.Tuples
 
Tuples.PairIterable<S,T> - Class in com.cloudera.crunch.util
 
Tuples.PairIterable(Iterable<S>, Iterable<T>) - Constructor for class com.cloudera.crunch.util.Tuples.PairIterable
 
Tuples.QuadIterable<A,B,C,D> - Class in com.cloudera.crunch.util
 
Tuples.QuadIterable(Iterable<A>, Iterable<B>, Iterable<C>, Iterable<D>) - Constructor for class com.cloudera.crunch.util.Tuples.QuadIterable
 
Tuples.TripIterable<A,B,C> - Class in com.cloudera.crunch.util
 
Tuples.TripIterable(Iterable<A>, Iterable<B>, Iterable<C>) - Constructor for class com.cloudera.crunch.util.Tuples.TripIterable
 
Tuples.TupleNIterable - Class in com.cloudera.crunch.util
 
Tuples.TupleNIterable(Iterable...) - Constructor for class com.cloudera.crunch.util.Tuples.TupleNIterable
 
TupleWritable - Class in com.cloudera.crunch.type.writable
A straight copy of the TupleWritable implementation in the join package, added here because of its package visibility restrictions.
TupleWritable() - Constructor for class com.cloudera.crunch.type.writable.TupleWritable
Create an empty tuple with no allocated storage for writables.
TupleWritable(Writable[]) - Constructor for class com.cloudera.crunch.type.writable.TupleWritable
Initialize tuple with storage; unknown whether any of them contain "written" values.
typedCollectionOf(PType<T>, T...) - Static method in class com.cloudera.crunch.impl.mem.MemPipeline
 
typedCollectionOf(PType<T>, Iterable<T>) - Static method in class com.cloudera.crunch.impl.mem.MemPipeline
 
typedTableOf(PTableType<S, T>, S, T, Object...) - Static method in class com.cloudera.crunch.impl.mem.MemPipeline
 
typedTableOf(PTableType<S, T>, Iterable<Pair<S, T>>) - Static method in class com.cloudera.crunch.impl.mem.MemPipeline
 

U

ungroup() - Method in class com.cloudera.crunch.impl.mr.collect.PGroupedTableImpl
 
ungroup() - Method in interface com.cloudera.crunch.PGroupedTable
Convert this grouping back into a multimap.
union(PCollection<S>...) - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
union(PTable<K, V>...) - Method in class com.cloudera.crunch.impl.mem.collect.MemTable
 
union(PCollection<S>...) - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
union(PTable<K, V>...) - Method in class com.cloudera.crunch.impl.mr.collect.PTableBase
 
union(PCollection<S>...) - Method in interface com.cloudera.crunch.PCollection
Returns a PCollection instance that acts as the union of this PCollection and the input PCollections.
union(PTable<K, V>...) - Method in interface com.cloudera.crunch.PTable
Returns a PTable instance that acts as the union of this PTable and the input PTables.
UnionCollection<S> - Class in com.cloudera.crunch.impl.mr.collect
 
UnionTable<K,V> - Class in com.cloudera.crunch.impl.mr.collect
 
UnionTable(List<PTableBase<K, V>>) - Constructor for class com.cloudera.crunch.impl.mr.collect.UnionTable
 
update(T) - Method in interface com.cloudera.crunch.CombineFn.Aggregator
Incorporate the given value into the aggregate state maintained by this instance.
update(V) - Method in class com.cloudera.crunch.CombineFn.FirstNAggregator
 
update(V) - Method in class com.cloudera.crunch.CombineFn.LastNAggregator
 
update(BigInteger) - Method in class com.cloudera.crunch.CombineFn.MaxBigInts
 
update(Double) - Method in class com.cloudera.crunch.CombineFn.MaxDoubles
 
update(Float) - Method in class com.cloudera.crunch.CombineFn.MaxFloats
 
update(Integer) - Method in class com.cloudera.crunch.CombineFn.MaxInts
 
update(Long) - Method in class com.cloudera.crunch.CombineFn.MaxLongs
 
update(V) - Method in class com.cloudera.crunch.CombineFn.MaxNAggregator
 
update(BigInteger) - Method in class com.cloudera.crunch.CombineFn.MinBigInts
 
update(Double) - Method in class com.cloudera.crunch.CombineFn.MinDoubles
 
update(Float) - Method in class com.cloudera.crunch.CombineFn.MinFloats
 
update(Integer) - Method in class com.cloudera.crunch.CombineFn.MinInts
 
update(Long) - Method in class com.cloudera.crunch.CombineFn.MinLongs
 
update(V) - Method in class com.cloudera.crunch.CombineFn.MinNAggregator
 
update(Pair<V1, V2>) - Method in class com.cloudera.crunch.CombineFn.PairAggregator
 
update(Tuple4<A, B, C, D>) - Method in class com.cloudera.crunch.CombineFn.QuadAggregator
 
update(BigInteger) - Method in class com.cloudera.crunch.CombineFn.SumBigInts
 
update(Double) - Method in class com.cloudera.crunch.CombineFn.SumDoubles
 
update(Float) - Method in class com.cloudera.crunch.CombineFn.SumFloats
 
update(Integer) - Method in class com.cloudera.crunch.CombineFn.SumInts
 
update(Long) - Method in class com.cloudera.crunch.CombineFn.SumLongs
 
update(Tuple3<A, B, C>) - Method in class com.cloudera.crunch.CombineFn.TripAggregator
 
update(TupleN) - Method in class com.cloudera.crunch.CombineFn.TupleNAggregator
 
UTF8_TO_STRING - Static variable in class com.cloudera.crunch.type.avro.Avros
 

V

valueOf(String) - Static method in enum com.cloudera.crunch.impl.mr.run.NodeContext
Returns the enum constant of this type with the specified name.
valueOf(String) - Static method in enum com.cloudera.crunch.lib.Sort.Order
Returns the enum constant of this type with the specified name.
valueOf(String) - Static method in enum org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob.State
Returns the enum constant of this type with the specified name.
valueOf(String) - Static method in enum org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl.ThreadState
Returns the enum constant of this type with the specified name.
values() - Static method in enum com.cloudera.crunch.impl.mr.run.NodeContext
Returns an array containing the constants of this enum type, in the order they are declared.
values(PTable<K, V>) - Static method in class com.cloudera.crunch.lib.PTables
 
values() - Static method in enum com.cloudera.crunch.lib.Sort.Order
Returns an array containing the constants of this enum type, in the order they are declared.
values() - Static method in enum org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob.State
Returns an array containing the constants of this enum type, in the order they are declared.
values() - Static method in enum org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl.ThreadState
Returns an array containing the constants of this enum type, in the order they are declared.
visit(DoNode) - Method in class com.cloudera.crunch.impl.mr.plan.JobNameBuilder
 
visit(List<DoNode>) - Method in class com.cloudera.crunch.impl.mr.plan.JobNameBuilder
 
visitDoFnCollection(DoCollectionImpl<?>) - Method in interface com.cloudera.crunch.impl.mr.collect.PCollectionImpl.Visitor
 
visitDoTable(DoTableImpl<?, ?>) - Method in interface com.cloudera.crunch.impl.mr.collect.PCollectionImpl.Visitor
 
visitGroupedTable(PGroupedTableImpl<?, ?>) - Method in interface com.cloudera.crunch.impl.mr.collect.PCollectionImpl.Visitor
 
visitInputCollection(InputCollection<?>) - Method in interface com.cloudera.crunch.impl.mr.collect.PCollectionImpl.Visitor
 
visitUnionCollection(UnionCollection<?>) - Method in interface com.cloudera.crunch.impl.mr.collect.PCollectionImpl.Visitor
 

W

wasLogged() - Method in exception com.cloudera.crunch.impl.mr.run.CrunchRuntimeException
 
WritableGroupedTableType<K,V> - Class in com.cloudera.crunch.type.writable
 
WritableGroupedTableType(WritableTableType<K, V>) - Constructor for class com.cloudera.crunch.type.writable.WritableGroupedTableType
 
WritablePairConverter<K,V> - Class in com.cloudera.crunch.type.writable
 
WritablePairConverter(Class<K>, Class<V>) - Constructor for class com.cloudera.crunch.type.writable.WritablePairConverter
 
Writables - Class in com.cloudera.crunch.type.writable
Defines static methods that are analogous to the methods defined in WritableTypeFamily for convenient static importing.
writables(Class<W>) - Static method in class com.cloudera.crunch.type.writable.Writables
 
writables(Class<W>) - Method in class com.cloudera.crunch.type.writable.WritableTypeFamily
 
WritableType<T,W> - Class in com.cloudera.crunch.type.writable
 
WritableTypeFamily - Class in com.cloudera.crunch.type.writable
The Writable-based implementation of the PTypeFamily interface.
write(Target) - Method in class com.cloudera.crunch.impl.mem.collect.MemCollection
 
write(Target) - Method in class com.cloudera.crunch.impl.mem.collect.MemTable
 
write(PCollection<?>, Target) - Method in class com.cloudera.crunch.impl.mem.MemPipeline
 
write(Target) - Method in class com.cloudera.crunch.impl.mr.collect.PCollectionImpl
 
write(Target) - Method in class com.cloudera.crunch.impl.mr.collect.PTableBase
 
write(PCollection<?>, Target) - Method in class com.cloudera.crunch.impl.mr.MRPipeline
 
write(DataOutput) - Method in class com.cloudera.crunch.impl.mr.run.CrunchInputSplit
 
write(Target) - Method in interface com.cloudera.crunch.PCollection
Write the contents of this PCollection to the given Target, using the storage format specified by the target.
write(PCollection<?>, Target) - Method in interface com.cloudera.crunch.Pipeline
Write the given collection to the given target on the next pipeline run.
write(Target) - Method in interface com.cloudera.crunch.PTable
Writes this PTable to the given Target.
write(PCollection<?>, Target) - Method in class com.cloudera.crunch.tool.CrunchTool
 
write(DataOutput) - Method in class com.cloudera.crunch.type.writable.GenericArrayWritable
 
write(DataOutput) - Method in class com.cloudera.crunch.type.writable.TextMapWritable
 
write(DataOutput) - Method in class com.cloudera.crunch.type.writable.TupleWritable
Writes each Writable to out.
write(Configuration, Path, Object) - Static method in class com.cloudera.crunch.util.DistCache
 
write(String, K, V) - Method in class org.apache.hadoop.mapreduce.lib.output.CrunchMultipleOutputs
Write key and value to the namedOutput.
write(String, K, V, String) - Method in class org.apache.hadoop.mapreduce.lib.output.CrunchMultipleOutputs
Write key and value to baseOutputPath using the namedOutput.
write(KEYOUT, VALUEOUT, String) - Method in class org.apache.hadoop.mapreduce.lib.output.CrunchMultipleOutputs
Write key and value to an output file name.
writeTextFile(PCollection<T>, String) - Method in class com.cloudera.crunch.impl.mem.MemPipeline
 
writeTextFile(PCollection<T>, String) - Method in class com.cloudera.crunch.impl.mr.MRPipeline
 
writeTextFile(PCollection<T>, String) - Method in interface com.cloudera.crunch.Pipeline
A convenience method for writing a text file.
writeTextFile(PCollection<?>, String) - Method in class com.cloudera.crunch.tool.CrunchTool
 

A B C D E F G H I J K L M N O P Q R S T U V W

Copyright © 2012. All Rights Reserved.