public class SparkUtils extends Object
Modifier and Type | Field and Description |
---|---|
static org.apache.spark.storage.StorageLevel |
DEFAULT_TMP |
Constructor and Description |
---|
SparkUtils() |
Modifier and Type | Method and Description |
---|---|
static org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixCell> |
cacheBinaryCellRDD(org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixCell> input) |
static MatrixCharacteristics |
computeMatrixCharacteristics(org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixCell> input)
Utility to compute dimensions and non-zeros in a given RDD of binary cells.
|
static org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixBlock> |
copyBinaryBlockMatrix(org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixBlock> in)
Creates a partitioning-preserving deep copy of the input matrix RDD, where
the indexes and values are copied.
|
static org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixBlock> |
copyBinaryBlockMatrix(org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixBlock> in,
boolean deep)
Creates a partitioning-preserving copy of the input matrix RDD.
|
static List<scala.Tuple2<Long,FrameBlock>> |
fromIndexedFrameBlock(List<Pair<Long,FrameBlock>> in) |
static scala.Tuple2<Long,FrameBlock> |
fromIndexedFrameBlock(Pair<Long,FrameBlock> in) |
static scala.Tuple2<MatrixIndexes,MatrixBlock> |
fromIndexedMatrixBlock(org.apache.sysml.runtime.matrix.mapred.IndexedMatrixValue in) |
static List<scala.Tuple2<MatrixIndexes,MatrixBlock>> |
fromIndexedMatrixBlock(List<org.apache.sysml.runtime.matrix.mapred.IndexedMatrixValue> in) |
static Pair<MatrixIndexes,MatrixBlock> |
fromIndexedMatrixBlockToPair(org.apache.sysml.runtime.matrix.mapred.IndexedMatrixValue in) |
static List<Pair<MatrixIndexes,MatrixBlock>> |
fromIndexedMatrixBlockToPair(List<org.apache.sysml.runtime.matrix.mapred.IndexedMatrixValue> in) |
static org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixBlock> |
getEmptyBlockRDD(org.apache.spark.api.java.JavaSparkContext sc,
MatrixCharacteristics mc)
Creates an RDD of empty blocks according to the given matrix characteristics.
|
static long |
getNonZeros(org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixBlock> input) |
static int |
getNumPreferredPartitions(MatrixCharacteristics mc) |
static int |
getNumPreferredPartitions(MatrixCharacteristics mc,
org.apache.spark.api.java.JavaPairRDD<?,?> in) |
static String |
getPrefixFromSparkDebugInfo(String line) |
static String |
getStartLineFromSparkDebugInfo(String line) |
static boolean |
isHashPartitioned(org.apache.spark.api.java.JavaPairRDD<?,?> in)
Indicates if the input RDD is hash partitioned, i.e., it has a partitioner
of type org.apache.spark.HashPartitioner. |
static Pair<Long,FrameBlock> |
toIndexedFrameBlock(scala.Tuple2<Long,FrameBlock> in) |
static List<Pair<Long,Long>> |
toIndexedLong(List<scala.Tuple2<Long,Long>> in) |
static org.apache.sysml.runtime.matrix.mapred.IndexedMatrixValue |
toIndexedMatrixBlock(MatrixIndexes ix,
MatrixBlock mb) |
static org.apache.sysml.runtime.matrix.mapred.IndexedMatrixValue |
toIndexedMatrixBlock(scala.Tuple2<MatrixIndexes,MatrixBlock> in) |
public static org.apache.sysml.runtime.matrix.mapred.IndexedMatrixValue toIndexedMatrixBlock(scala.Tuple2<MatrixIndexes,MatrixBlock> in)
public static org.apache.sysml.runtime.matrix.mapred.IndexedMatrixValue toIndexedMatrixBlock(MatrixIndexes ix, MatrixBlock mb)
public static scala.Tuple2<MatrixIndexes,MatrixBlock> fromIndexedMatrixBlock(org.apache.sysml.runtime.matrix.mapred.IndexedMatrixValue in)
public static List<scala.Tuple2<MatrixIndexes,MatrixBlock>> fromIndexedMatrixBlock(List<org.apache.sysml.runtime.matrix.mapred.IndexedMatrixValue> in)
public static Pair<MatrixIndexes,MatrixBlock> fromIndexedMatrixBlockToPair(org.apache.sysml.runtime.matrix.mapred.IndexedMatrixValue in)
public static List<Pair<MatrixIndexes,MatrixBlock>> fromIndexedMatrixBlockToPair(List<org.apache.sysml.runtime.matrix.mapred.IndexedMatrixValue> in)
public static scala.Tuple2<Long,FrameBlock> fromIndexedFrameBlock(Pair<Long,FrameBlock> in)
public static List<scala.Tuple2<Long,FrameBlock>> fromIndexedFrameBlock(List<Pair<Long,FrameBlock>> in)
public static Pair<Long,FrameBlock> toIndexedFrameBlock(scala.Tuple2<Long,FrameBlock> in)
public static boolean isHashPartitioned(org.apache.spark.api.java.JavaPairRDD<?,?> in)
Indicates if the input RDD is hash partitioned, i.e., it has a partitioner of type org.apache.spark.HashPartitioner.
Parameters:
in - input JavaPairRDD
public static int getNumPreferredPartitions(MatrixCharacteristics mc, org.apache.spark.api.java.JavaPairRDD<?,?> in)
public static int getNumPreferredPartitions(MatrixCharacteristics mc)
public static org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixBlock> copyBinaryBlockMatrix(org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixBlock> in)
Parameters:
in - matrix as JavaPairRDD<MatrixIndexes,MatrixBlock>
Returns:
JavaPairRDD<MatrixIndexes,MatrixBlock>
public static org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixBlock> copyBinaryBlockMatrix(org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixBlock> in, boolean deep)
Parameters:
in - matrix as JavaPairRDD<MatrixIndexes,MatrixBlock>
deep - if true, perform deep copy
Returns:
JavaPairRDD<MatrixIndexes,MatrixBlock>
public static org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixBlock> getEmptyBlockRDD(org.apache.spark.api.java.JavaSparkContext sc, MatrixCharacteristics mc)
Parameters:
sc - spark context
mc - matrix characteristics
public static org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixCell> cacheBinaryCellRDD(org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixCell> input)
public static MatrixCharacteristics computeMatrixCharacteristics(org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixCell> input)
Parameters:
input - matrix as JavaPairRDD<MatrixIndexes,MatrixCell>
public static long getNonZeros(org.apache.spark.api.java.JavaPairRDD<MatrixIndexes,MatrixBlock> input)
Copyright © 2018 The Apache Software Foundation. All rights reserved.