public final class SparkInput
extends java.lang.Object
| Modifier and Type | Method and Description |
|---|---|
static org.apache.spark.api.java.JavaRDD<org.openstreetmap.atlas.geography.atlas.Atlas> |
atlasFiles(org.apache.spark.api.java.JavaSparkContext context,
java.lang.String path)
Load Atlas files from an input path
|
static org.apache.spark.api.java.JavaPairRDD<java.lang.String,org.apache.spark.input.PortableDataStream> |
binaryFile(org.apache.spark.api.java.JavaSparkContext context,
java.lang.String path)
Get an RDD from a binary file input
|
static <K extends org.apache.hadoop.io.Writable,V extends org.apache.hadoop.io.Writable> org.apache.spark.api.java.JavaPairRDD<K,V> |
sequenceFile(org.apache.spark.api.java.JavaSparkContext context,
java.lang.String path,
java.lang.Class<K> sequenceKeyClass,
java.lang.Class<V> sequenceValueClass)
Get an RDD from a sequence file input
|
protected static void |
setFileSystemCreator(FileSystemCreator fileSystemCreator) |
static org.apache.spark.api.java.JavaRDD<java.lang.String> |
textFile(org.apache.spark.api.java.JavaSparkContext context,
java.lang.String path)
Get an RDD from a Text file input
|
public static org.apache.spark.api.java.JavaRDD<org.openstreetmap.atlas.geography.atlas.Atlas> atlasFiles(org.apache.spark.api.java.JavaSparkContext context,
java.lang.String path)
context - The context from Spark
path - The path to a set of atlas files

public static org.apache.spark.api.java.JavaPairRDD<java.lang.String,org.apache.spark.input.PortableDataStream> binaryFile(org.apache.spark.api.java.JavaSparkContext context,
java.lang.String path)
context - The context from Spark
path - The path to a set of binary files

public static <K extends org.apache.hadoop.io.Writable,V extends org.apache.hadoop.io.Writable> org.apache.spark.api.java.JavaPairRDD<K,V> sequenceFile(org.apache.spark.api.java.JavaSparkContext context,
java.lang.String path,
java.lang.Class<K> sequenceKeyClass,
java.lang.Class<V> sequenceValueClass)
K - The key type in the sequence file
V - The value type in the sequence file
context - The context from Spark
path - The path to a set of sequence files
sequenceKeyClass - The class to expect for the sequence file keys
sequenceValueClass - The class to expect for the sequence file values

public static org.apache.spark.api.java.JavaRDD<java.lang.String> textFile(org.apache.spark.api.java.JavaSparkContext context,
java.lang.String path)
context - The context from Spark
path - The path to open
Returns: String line per item.

protected static void setFileSystemCreator(FileSystemCreator fileSystemCreator)