AutoCacheRule

Instance Constructors

new AutoCacheRule(cachingMode: CachingStrategy)

Type Members

case class ProfilingState(registers: Map[NodeId, Expression], numPerPartitionPerNode: Map[NodeId, Map[Int, Int]], profiles: Map[NodeId, Profile]) extends Product with Serializable

Value Members

final def !=(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def !=(arg0: Any): Boolean

Definition Classes
Any
final def ##(): Int

Definition Classes
AnyRef → Any
final def ==(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def ==(arg0: Any): Boolean

Definition Classes
Any
def addCachesToPipeline(pipe: Graph, cachesToAdd: Set[NodeId]): Graph

Given a pipeline DAG and an additional set of nodes to cache, return a DAG with those nodes cached.
def aggressiveCache(graph: Graph): Graph
def apply(plan: Graph, prefixes: Map[NodeId, Prefix]): (Graph, Map[NodeId, Prefix])

Definition Classes
AutoCacheRule → Rule
final def asInstanceOf[T0]: T0

Definition Classes
Any
def cachedMem(cached: Set[NodeId], profiles: Map[NodeId, Profile]): Long
def clone(): AnyRef

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( ... )
final def eq(arg0: AnyRef): Boolean

Definition Classes
AnyRef
def equals(arg0: Any): Boolean

Definition Classes
AnyRef → Any
def estimateCachedRunTime(graph: Graph, linearization: Seq[GraphId], childrenByNode: Map[NodeId, Seq[GraphId]], cached: Set[NodeId], profiles: Map[NodeId, Profile]): Double

Estimates the total runtime of a pipeline given the cached set of nodes
def finalize(): Unit

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.Throwable] )
def generalizeProfiles(newScale: Long, sampleProfiles: Seq[SampleProfile]): Profile

This method takes a sequence of profiles collected at different sample sizes and generalizes them to a new data scale by fitting linear models of memory and CPU usage as a function of data scale, then using those models at the new scale.
def getChildrenForAllNodes(graph: Graph): Map[NodeId, Seq[GraphId]]

Get a map representing the children for each node. Note: This doesn't capture how many times each child depends on the instruction.
final def getClass(): Class[_]

Definition Classes
AnyRef → Any
def getDescendantsOfSources(graph: Graph): Set[NodeId]

Get all descendants of all sources in the graph
def getNodeWeights(graph: Graph): Map[NodeId, Int]

Get the operator weights: estimates for how many passes an operator will make over its input dependencies
def getRuns(linearization: Seq[GraphId], childrenByNode: Map[NodeId, Seq[GraphId]], cached: Set[NodeId], nodeWeights: Map[NodeId, Int]): Map[NodeId, Int]

Get an estimate for how many times the output of each node will be accessed, assuming the given set of nodes have their outputs cached.
Note: This assumes all sinks are accessed exactly once!
def greedyCache(graph: Graph, profiles: Map[NodeId, Profile], maxMem: Option[Long]): Graph
def hashCode(): Int

Definition Classes
AnyRef → Any
def initCacheSet(graph: Graph): Set[NodeId]

Get the initial set of what nodes will have their results effectively cached
final def isInstanceOf[T0]: Boolean

Definition Classes
Any
def log: Logger

Attributes
protected
Definition Classes
Logging
def logDebug(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logDebug(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logError(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logError(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logInfo(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logInfo(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logTrace(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logTrace(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logWarning(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logWarning(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
final def ne(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def notify(): Unit

Definition Classes
AnyRef
final def notifyAll(): Unit

Definition Classes
AnyRef
def profileNodes(graph: Graph, linearization: Seq[GraphId], nodesToProfile: Set[NodeId], partitionScales: Seq[Long], numTrials: Int): Map[NodeId, Profile]

Get profiles of nodes in the pipeline
graph
The pipeline DAG
linearization
A linearization of the nodes of the pipeline DAG
nodesToProfile
The nodes to collect profiling information for
partitionScales
The scales to profile at (expected number of data points per partition)
numTrials
The number of times to profile at each scale
returns
val ruleName: String

Name for this rule, automatically inferred based on class name.

Definition Classes
Rule
def selectNext(graph: Graph, linearization: Seq[GraphId], profiles: Map[NodeId, Profile], childrenByNode: Map[NodeId, Seq[GraphId]], cached: Set[NodeId], runs: Map[NodeId, Int], spaceLeft: Long): NodeId
def stillRoom(cached: Set[NodeId], runs: Map[NodeId, Int], profiles: Map[NodeId, Profile], spaceLeft: Long): Boolean

Returns true iff there is still an uncached node whose output is used more than once and that would fit in memory if cached.
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes
AnyRef
def toString(): String

Definition Classes
AnyRef → Any
final def wait(): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )

class AutoCacheRule extends Rule with Logging

Instance Constructors

new AutoCacheRule(cachingMode: CachingStrategy)

Type Members

case class ProfilingState(registers: Map[NodeId, Expression], numPerPartitionPerNode: Map[NodeId, Map[Int, Int]], profiles: Map[NodeId, Profile]) extends Product with Serializable

Value Members

final def !=(arg0: AnyRef): Boolean

final def !=(arg0: Any): Boolean

final def ##(): Int

final def ==(arg0: AnyRef): Boolean

final def ==(arg0: Any): Boolean

def addCachesToPipeline(pipe: Graph, cachesToAdd: Set[NodeId]): Graph

def aggressiveCache(graph: Graph): Graph

def apply(plan: Graph, prefixes: Map[NodeId, Prefix]): (Graph, Map[NodeId, Prefix])

final def asInstanceOf[T0]: T0

def cachedMem(cached: Set[NodeId], profiles: Map[NodeId, Profile]): Long

def clone(): AnyRef

final def eq(arg0: AnyRef): Boolean

def equals(arg0: Any): Boolean

def estimateCachedRunTime(graph: Graph, linearization: Seq[GraphId], childrenByNode: Map[NodeId, Seq[GraphId]], cached: Set[NodeId], profiles: Map[NodeId, Profile]): Double

def finalize(): Unit

def generalizeProfiles(newScale: Long, sampleProfiles: Seq[SampleProfile]): Profile

def getChildrenForAllNodes(graph: Graph): Map[NodeId, Seq[GraphId]]

final def getClass(): Class[_]

def getDescendantsOfSources(graph: Graph): Set[NodeId]

def getNodeWeights(graph: Graph): Map[NodeId, Int]

def getRuns(linearization: Seq[GraphId], childrenByNode: Map[NodeId, Seq[GraphId]], cached: Set[NodeId], nodeWeights: Map[NodeId, Int]): Map[NodeId, Int]

def greedyCache(graph: Graph, profiles: Map[NodeId, Profile], maxMem: Option[Long]): Graph

def hashCode(): Int

def initCacheSet(graph: Graph): Set[NodeId]

final def isInstanceOf[T0]: Boolean

def log: Logger

def logDebug(msg: ⇒ String, throwable: Throwable): Unit

def logDebug(msg: ⇒ String): Unit

def logError(msg: ⇒ String, throwable: Throwable): Unit

def logError(msg: ⇒ String): Unit

def logInfo(msg: ⇒ String, throwable: Throwable): Unit

def logInfo(msg: ⇒ String): Unit

def logTrace(msg: ⇒ String, throwable: Throwable): Unit

def logTrace(msg: ⇒ String): Unit

def logWarning(msg: ⇒ String, throwable: Throwable): Unit

def logWarning(msg: ⇒ String): Unit

final def ne(arg0: AnyRef): Boolean

final def notify(): Unit

final def notifyAll(): Unit

def profileNodes(graph: Graph, linearization: Seq[GraphId], nodesToProfile: Set[NodeId], partitionScales: Seq[Long], numTrials: Int): Map[NodeId, Profile]

val ruleName: String

def selectNext(graph: Graph, linearization: Seq[GraphId], profiles: Map[NodeId, Profile], childrenByNode: Map[NodeId, Seq[GraphId]], cached: Set[NodeId], runs: Map[NodeId, Int], spaceLeft: Long): NodeId

def stillRoom(cached: Set[NodeId], runs: Map[NodeId, Int], profiles: Map[NodeId, Profile], spaceLeft: Long): Boolean

final def synchronized[T0](arg0: ⇒ T0): T0

def toString(): String

final def wait(): Unit

final def wait(arg0: Long, arg1: Int): Unit

final def wait(arg0: Long): Unit

Inherited from Logging

Inherited from Rule

Inherited from AnyRef

Inherited from Any

Ungrouped