object AlgebirdRDDMetrics
Metrics implemented using the Algebird library (abstract algebra for Scala): https://github.com/twitter/algebird
- Alphabetic
- By Inheritance
- AlgebirdRDDMetrics
- AnyRef
- Any
- Hide All
- Show All
- Public
- All
Type Members
-
case class
HLLSequenceCompletenessRDDMetricCalculator(hLL: HLL, bitsNumber: Int, minVal: Long, maxVal: Long, accuracyError: Double, increment: Long, failCount: Long = 0, status: CalculatorStatus = CalculatorStatus.Success, failMsg: String = "OK") extends RDDMetricCalculator with Product with Serializable
Calculates approximate completeness of an incremental integer (long) sequence.
Calculates approximate completeness of an incremental integer (long) sequence, i.e. checks that the sequence has no missing elements. The check is performed using the HyperLogLog probabilistic algorithm. Works for a single column only!
- hLL
Initial HyperLogLog monoid
- bitsNumber
Size of HLL (calculated automatically for the specified accuracy error)
- minVal
Minimum observed value in a sequence
- maxVal
Maximum observed value in a sequence
- accuracyError
Error of calculation
- increment
Sequence increment
- returns
result map with key: "APPROXIMATE_SEQUENCE_COMPLETENESS"
-
case class
HyperLogLogRDDMetricCalculator(hLL: HLL, bitsNumber: Int, accuracyError: Double, failCount: Long = 0, status: CalculatorStatus = CalculatorStatus.Success, failMsg: String = "OK") extends RDDMetricCalculator with Product with Serializable
Calculates the approximate number of distinct values among the processed elements
Calculates the approximate number of distinct values among the processed elements
Works for a single column only!
- hLL
Initial HyperLogLog monoid
- bitsNumber
Size of HLL (calculated automatically for the specified accuracy error)
- accuracyError
Error of calculation.
- returns
result map with key: "APPROXIMATE_DISTINCT_VALUES"
-
case class
TopKRDDMetricCalculator(list: SpaceSaver[String], maxCapacity: Int, targetNumber: Int, rowCount: Int, failCount: Long = 0, status: CalculatorStatus = CalculatorStatus.Success, failMsg: String = "OK") extends RDDMetricCalculator with Product with Serializable
Calculates the top N elements among the processed elements
Calculates the top N elements among the processed elements
Works for a single column only!
- list
Initial SpaceSaver monoid
- maxCapacity
Maximal size of SpaceSaver
- targetNumber
Required N
- returns
result map with keys: "TOP_N_{index}"
Value Members
-
final
def
!=(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
final
def
##(): Int
- Definition Classes
- AnyRef → Any
-
final
def
==(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
final
def
asInstanceOf[T0]: T0
- Definition Classes
- Any
-
def
clone(): AnyRef
- Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native()
-
final
def
eq(arg0: AnyRef): Boolean
- Definition Classes
- AnyRef
-
def
equals(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
def
finalize(): Unit
- Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( classOf[java.lang.Throwable] )
-
final
def
getClass(): Class[_]
- Definition Classes
- AnyRef → Any
- Annotations
- @native()
-
def
hashCode(): Int
- Definition Classes
- AnyRef → Any
- Annotations
- @native()
-
final
def
isInstanceOf[T0]: Boolean
- Definition Classes
- Any
-
final
def
ne(arg0: AnyRef): Boolean
- Definition Classes
- AnyRef
-
final
def
notify(): Unit
- Definition Classes
- AnyRef
- Annotations
- @native()
-
final
def
notifyAll(): Unit
- Definition Classes
- AnyRef
- Annotations
- @native()
-
final
def
synchronized[T0](arg0: ⇒ T0): T0
- Definition Classes
- AnyRef
-
def
toString(): String
- Definition Classes
- AnyRef → Any
-
final
def
wait(): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... )
-
final
def
wait(arg0: Long, arg1: Int): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... )
-
final
def
wait(arg0: Long): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native()