SparkPlanner

Instance Constructors

new SparkPlanner()

Type Members

case class CommandStrategy extends Strategy with Product with Serializable

Definition Classes
SparkStrategies

Value Members

final def !=(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def !=(arg0: Any): Boolean

Definition Classes
Any
final def ##(): Int

Definition Classes
AnyRef → Any
final def ==(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def ==(arg0: Any): Boolean

Definition Classes
Any
object BasicOperators extends Strategy

Definition Classes
SparkStrategies
object BroadcastNestedLoopJoin extends Strategy

Definition Classes
SparkStrategies
object CartesianProduct extends Strategy

Definition Classes
SparkStrategies
object HashAggregation extends Strategy

Definition Classes
SparkStrategies
object HashJoin extends Strategy with PredicateHelper

Uses the ExtractEquiJoinKeys pattern to find joins where at least some of the predicates can be evaluated by matching hash keys.
This strategy applies a simple optimization based on the estimates of the physical sizes of the two join sides. When planning a joins.BroadcastHashJoin, if one side has an estimated physical size smaller than the user-settable threshold org.apache.spark.sql.SQLConf.AUTO_BROADCASTJOIN_THRESHOLD, the planner marks it as the build relation and marks the other relation as the stream side. The build table is broadcast to all of the executors involved in the join as an org.apache.spark.broadcast.Broadcast object. If both estimates exceed the threshold, they are instead used to decide the build side in a joins.ShuffledHashJoin.

Definition Classes
SparkStrategies
object InMemoryScans extends Strategy

Definition Classes
SparkStrategies
object LeftSemiJoin extends Strategy with PredicateHelper

Definition Classes
SparkStrategies
object ParquetOperations extends Strategy

Definition Classes
SparkStrategies
object TakeOrdered extends Strategy

Definition Classes
SparkStrategies
def apply(plan: LogicalPlan): Iterator[SparkPlan]

Definition Classes
QueryPlanner
final def asInstanceOf[T0]: T0

Definition Classes
Any
def clone(): AnyRef

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( ... )
def codegenEnabled: Boolean
final def eq(arg0: AnyRef): Boolean

Definition Classes
AnyRef
def equals(arg0: Any): Boolean

Definition Classes
AnyRef → Any
def finalize(): Unit

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.Throwable] )
final def getClass(): Class[_]

Definition Classes
AnyRef → Any
def hashCode(): Int

Definition Classes
AnyRef → Any
final def isInstanceOf[T0]: Boolean

Definition Classes
Any
final def ne(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def notify(): Unit

Definition Classes
AnyRef
final def notifyAll(): Unit

Definition Classes
AnyRef
def numPartitions: Int
def planLater(plan: LogicalPlan): SparkPlan

Attributes
protected
Definition Classes
QueryPlanner
def pruneFilterProject(projectList: Seq[NamedExpression], filterPredicates: Seq[Expression], prunePushedDownFilters: (Seq[Expression]) ⇒ Seq[Expression], scanBuilder: (Seq[Attribute]) ⇒ SparkPlan): SparkPlan

Used to build table scan operators where complex projection and filtering are done using separate physical operators. This function returns the given scan operator with Project and Filter nodes added only when needed. For example, a Project operator is only used when the final desired output requires complex expressions to be evaluated or when columns can be further eliminated after filtering has been done.
The prunePushedDownFilters parameter is used to remove those filters that can be optimized away by the filter pushdown optimization.
The required attributes for both filtering and expression evaluation are passed to the provided scanBuilder function so that it can avoid unnecessary column materialization.
lazy val singleRowRdd: RDD[catalyst.expressions.Row]

Attributes
protected
Definition Classes
SparkStrategies
val sparkContext: SparkContext
val sqlContext: SQLContext
def strategies: Seq[Strategy]

Definition Classes
SparkPlanner → QueryPlanner
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes
AnyRef
def toString(): String

Definition Classes
AnyRef → Any
final def wait(): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )

class SparkPlanner extends SparkStrategies

Instance Constructors

new SparkPlanner()

Type Members

case class CommandStrategy extends Strategy with Product with Serializable

Value Members

final def !=(arg0: AnyRef): Boolean

final def !=(arg0: Any): Boolean

final def ##(): Int

final def ==(arg0: AnyRef): Boolean

final def ==(arg0: Any): Boolean

object BasicOperators extends Strategy

object BroadcastNestedLoopJoin extends Strategy

object CartesianProduct extends Strategy

object HashAggregation extends Strategy

object HashJoin extends Strategy with PredicateHelper

object InMemoryScans extends Strategy

object LeftSemiJoin extends Strategy with PredicateHelper

object ParquetOperations extends Strategy

object TakeOrdered extends Strategy

def apply(plan: LogicalPlan): Iterator[SparkPlan]

final def asInstanceOf[T0]: T0

def clone(): AnyRef

def codegenEnabled: Boolean

final def eq(arg0: AnyRef): Boolean

def equals(arg0: Any): Boolean

def finalize(): Unit

final def getClass(): Class[_]

def hashCode(): Int

final def isInstanceOf[T0]: Boolean

final def ne(arg0: AnyRef): Boolean

final def notify(): Unit

final def notifyAll(): Unit

def numPartitions: Int

def planLater(plan: LogicalPlan): SparkPlan

def pruneFilterProject(projectList: Seq[NamedExpression], filterPredicates: Seq[Expression], prunePushedDownFilters: (Seq[Expression]) ⇒ Seq[Expression], scanBuilder: (Seq[Attribute]) ⇒ SparkPlan): SparkPlan

lazy val singleRowRdd: RDD[catalyst.expressions.Row]

val sparkContext: SparkContext

val sqlContext: SQLContext

def strategies: Seq[Strategy]

final def synchronized[T0](arg0: ⇒ T0): T0

def toString(): String

final def wait(): Unit

final def wait(arg0: Long, arg1: Int): Unit

final def wait(arg0: Long): Unit

Inherited from SparkStrategies

Inherited from QueryPlanner[SparkPlan]

Inherited from AnyRef

Inherited from Any

Ungrouped