CompareADAM

CompareADAM is a tool for pairwise comparison of ADAM files (or merged sets of ADAM files; see the note on the -recurse{1,2} optional parameters, below).

The canonical use-case for CompareADAM involves a single input file run through (for example) two different implementations of the same pipeline, producing two comparable ADAM files at the end.

CompareADAM loads these ADAM files and performs a read-name-based equi-join. It then computes one or more metrics (embodied as BucketComparisons values) across the joined records, as specified on the command line, and aggregates each metric into a histogram (this can be changed if other aggregations are required in the future). Finally, it writes the resulting histograms to a specified directory as text files.

There is an R script in the adam-scripts module to process those outputs into a figure.

The available metrics to be calculated are defined, by name, in the DefaultComparisons object.

A subsequent tool like FindReads can be used to track down which reads give rise to particular aggregated bins in the output histograms, if further diagnosis is needed.

Linear Supertypes

Serializable (scala.Serializable), Serializable (java.io.Serializable), BDGCommandCompanion, AnyRef, Any

Type Members

type GeneratedResults[A] = RDD[(String, Seq[A])]

Value Members

final def !=(arg0: Any): Boolean

Definition Classes
AnyRef → Any
final def ##(): Int

Definition Classes
AnyRef → Any
final def ==(arg0: Any): Boolean

Definition Classes
AnyRef → Any
def apply(cmdLine: Array[String]): BDGCommand

Definition Classes
CompareADAM → BDGCommandCompanion
final def asInstanceOf[T0]: T0

Definition Classes
Any
def clone(): AnyRef

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( ... )
val commandDescription: String

Definition Classes
CompareADAM → BDGCommandCompanion
val commandName: String

Definition Classes
CompareADAM → BDGCommandCompanion
final def eq(arg0: AnyRef): Boolean

Definition Classes
AnyRef
def equals(arg0: Any): Boolean

Definition Classes
AnyRef → Any
def finalize(): Unit

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.Throwable] )
final def getClass(): Class[_]

Definition Classes
AnyRef → Any
def hashCode(): Int

Definition Classes
AnyRef → Any
final def isInstanceOf[T0]: Boolean

Definition Classes
Any
def main(cmdLine: Array[String]): Unit

Definition Classes
BDGCommandCompanion
final def ne(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def notify(): Unit

Definition Classes
AnyRef
final def notifyAll(): Unit

Definition Classes
AnyRef
def parseGenerators(names: Seq[String]): Seq[BucketComparisons[Any]]
def parseGenerators(nameList: String): Seq[BucketComparisons[Any]]
def setupTraversalEngine(sc: SparkContext, input1Path: String, recurse1: String, input2Path: String, recurse2: String, generator: BucketComparisons[Any]): ComparisonTraversalEngine

See also
CompareADAMArgs.recurse1, CompareADAMArgs.recurse2
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes
AnyRef
def toString(): String

Definition Classes
AnyRef → Any
final def wait(): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )

object CompareADAM extends BDGCommandCompanion with Serializable

Type Members

type GeneratedResults[A] = RDD[(String, Seq[A])]

Value Members

final def !=(arg0: Any): Boolean

final def ##(): Int

final def ==(arg0: Any): Boolean

def apply(cmdLine: Array[String]): BDGCommand

final def asInstanceOf[T0]: T0

def clone(): AnyRef

val commandDescription: String

val commandName: String

final def eq(arg0: AnyRef): Boolean

def equals(arg0: Any): Boolean

def finalize(): Unit

final def getClass(): Class[_]

def hashCode(): Int

final def isInstanceOf[T0]: Boolean

def main(cmdLine: Array[String]): Unit

final def ne(arg0: AnyRef): Boolean

final def notify(): Unit

final def notifyAll(): Unit

def parseGenerators(names: Seq[String]): Seq[BucketComparisons[Any]]

def parseGenerators(nameList: String): Seq[BucketComparisons[Any]]

def setupTraversalEngine(sc: SparkContext, input1Path: String, recurse1: String, input2Path: String, recurse2: String, generator: BucketComparisons[Any]): ComparisonTraversalEngine

final def synchronized[T0](arg0: ⇒ T0): T0

def toString(): String

final def wait(): Unit

final def wait(arg0: Long, arg1: Int): Unit

final def wait(arg0: Long): Unit

Inherited from Serializable (scala.Serializable)

Inherited from Serializable (java.io.Serializable)

Inherited from BDGCommandCompanion

Inherited from AnyRef

Inherited from Any

Ungrouped