class
CatalystHashFunction extends AnyRef
Instance Constructors
-
new
CatalystHashFunction()
Value Members
-
final
def
!=(arg0: AnyRef): Boolean
-
final
def
!=(arg0: Any): Boolean
-
final
def
##(): Int
-
final
def
==(arg0: AnyRef): Boolean
-
final
def
==(arg0: Any): Boolean
-
final
def
asInstanceOf[T0]: T0
-
def
clone(): AnyRef
-
def
computeHash(key: Any): Int
-
def
computeHashCode(str: String): Int
-
def
computeHashCode(time: Timestamp): Int
-
def
computeHashCode(sd: Date): Int
-
final
def
eq(arg0: AnyRef): Boolean
-
def
equals(arg0: Any): Boolean
-
def
finalize(): Unit
-
final
def
getClass(): Class[_]
-
def
hashCode(): Int
-
def
hashValue(objs: Array[AnyRef]): Int
-
def
hashValue(key: Any): Int
-
final
def
isInstanceOf[T0]: Boolean
-
final
def
ne(arg0: AnyRef): Boolean
-
final
def
notify(): Unit
-
final
def
notifyAll(): Unit
-
final
def
synchronized[T0](arg0: ⇒ T0): T0
-
def
toString(): String
-
final
def
wait(): Unit
-
final
def
wait(arg0: Long, arg1: Int): Unit
-
final
def
wait(arg0: Long): Unit
Inherited from AnyRef
Inherited from Any
This class acts as a public interface to the hash code logic implemented at the Catalyst layer. It ensures that Spark's partitioning and the store's partitioning follow the same logic. This helps reduce shuffle operations when a Spark DataFrame is joined with store data. PairRDDs can also use this partitioner to colocate their data with store tables/DataFrames.