SharkSemanticAnalyzer

Instance Constructors

new SharkSemanticAnalyzer(conf: HiveConf)

Type Members

class AnalyzeCreateCommonVars extends AnyRef

Attributes
private[org.apache.hadoop.hive.ql.parse]
Definition Classes
BaseSemanticAnalyzer
class RowFormatParams extends AnyRef

Attributes
private[org.apache.hadoop.hive.ql.parse]
Definition Classes
BaseSemanticAnalyzer
class StorageFormat extends AnyRef

Attributes
private[org.apache.hadoop.hive.ql.parse]
Definition Classes
BaseSemanticAnalyzer

Value Members

final def !=(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def !=(arg0: Any): Boolean

Definition Classes
Any
final def ##(): Int

Definition Classes
AnyRef → Any
final def ==(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def ==(arg0: Any): Boolean

Definition Classes
Any
var _resSchema: List[FieldSchema]
def analyze(arg0: ASTNode, arg1: Context): Unit

Definition Classes
BaseSemanticAnalyzer
Annotations
@throws( ... )
def analyzeCreateTable(rootAST: ASTNode, queryBlock: QueryBlock): Option[ASTNode]
def analyzeDDLSkewedValues(arg0: List[List[String]], arg1: ASTNode): Unit

Attributes
protected[org.apache.hadoop.hive.ql.parse]
Definition Classes
BaseSemanticAnalyzer
Annotations
@throws( ... )
def analyzeInternal(ast: ASTNode): Unit

Overrides SemanticAnalyzer.analyzeInternal to handle CTAS caching and INSERT updates.
Unified views: For CTAS and INSERT INTO/OVERWRITE, the generated Shark query plan matches the one that would be created if the target table were not cached. Disk-to-memory loading is done by a SparkLoadTask that executes after all other tasks (SparkTask, Hive MoveTasks) have finished executing. For INSERT INTO, the SparkLoadTask can determine which new files should be loaded into the cache by using a path filter based on a snapshot of the table/partition data directory taken in genMapRedTasks(). For CTAS, a path filter isn't used; everything in the data directory is loaded into the cache.
Non-unified views (i.e., the cached table content is memory-only): The query plan's FileSinkOperator is replaced by a MemoryStoreSinkOperator. The MemoryStoreSinkOperator creates a new table (or partition) entry in the Shark metastore for CTAS, and creates UnionRDDs for INSERT INTO commands.

Definition Classes
SharkSemanticAnalyzer → SemanticAnalyzer → BaseSemanticAnalyzer
def analyzeSkewedTablDDLColNames(arg0: List[String], arg1: ASTNode): List[String]

Attributes
protected[org.apache.hadoop.hive.ql.parse]
Definition Classes
BaseSemanticAnalyzer
Annotations
@throws( ... )
def analyzeStoredAdDirs(arg0: ASTNode): Boolean

Attributes
protected[org.apache.hadoop.hive.ql.parse]
Definition Classes
BaseSemanticAnalyzer
final def asInstanceOf[T0]: T0

Definition Classes
Any
def clone(): AnyRef

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( ... )
def constructListBucketingCtx(arg0: List[String], arg1: List[List[String]], arg2: Map[SkewedValueList, String], arg3: Boolean, arg4: HiveConf): ListBucketingCtx

Attributes
protected[org.apache.hadoop.hive.ql.parse]
Definition Classes
BaseSemanticAnalyzer
def doPhase1(arg0: ASTNode, arg1: QB, arg2: Phase1Ctx): Boolean

Definition Classes
SemanticAnalyzer
Annotations
@throws( ... )
def doPhase1QBExpr(arg0: ASTNode, arg1: QBExpr, arg2: String, arg3: String): Unit

Definition Classes
SemanticAnalyzer
Annotations
@throws( ... )
final def eq(arg0: AnyRef): Boolean

Definition Classes
AnyRef
def equals(arg0: Any): Boolean

Definition Classes
AnyRef → Any
def errStream(): PrintStream

Definition Classes
LogHelper
def extractPartitionSpecs(arg0: Tree): HashMap[String, String]

Attributes
protected[org.apache.hadoop.hive.ql.parse]
Definition Classes
BaseSemanticAnalyzer
Annotations
@throws( ... )
def finalize(): Unit

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.Throwable] )
def genAllExprNodeDesc(arg0: ASTNode, arg1: RowResolver, arg2: TypeCheckCtx): Map[ASTNode, ExprNodeDesc]

Definition Classes
SemanticAnalyzer
Annotations
@throws( ... )
def genAllExprNodeDesc(arg0: ASTNode, arg1: RowResolver): Map[ASTNode, ExprNodeDesc]

Definition Classes
SemanticAnalyzer
Annotations
@throws( ... )
def genExprNodeDesc(arg0: ASTNode, arg1: RowResolver, arg2: TypeCheckCtx): ExprNodeDesc

Definition Classes
SemanticAnalyzer
Annotations
@throws( ... )
def genExprNodeDesc(arg0: ASTNode, arg1: RowResolver): ExprNodeDesc

Definition Classes
SemanticAnalyzer
Annotations
@throws( ... )
def genMapRedTasks(qb: QueryBlock, pctx: ParseContext, terminalOps: Seq[TerminalOperator]): Unit

Generate tasks for executing the query, including the SparkTask to do the select, the MoveTask for updates, and the DDLTask for CTAS.
def genPlan(arg0: QB): Operator[_ <: OperatorDesc]

Definition Classes
SemanticAnalyzer
Annotations
@throws( ... )
final def getClass(): Class[_]

Definition Classes
AnyRef → Any
def getColumnAccessInfo(): ColumnAccessInfo

Definition Classes
BaseSemanticAnalyzer
def getColumnNames(arg0: ASTNode): List[String]

Attributes
protected[org.apache.hadoop.hive.ql.parse]
Definition Classes
BaseSemanticAnalyzer
def getColumnNamesOrder(arg0: ASTNode): List[Order]

Attributes
protected[org.apache.hadoop.hive.ql.parse]
Definition Classes
BaseSemanticAnalyzer
def getColumns(arg0: ASTNode): List[FieldSchema]

Attributes
protected[org.apache.hadoop.hive.ql.parse]
Definition Classes
BaseSemanticAnalyzer
Annotations
@throws( ... )
def getDb(): Hive

Definition Classes
BaseSemanticAnalyzer
def getFetchTask(): FetchTask

Definition Classes
BaseSemanticAnalyzer
def getIdToTableNameMap(): HashMap[String, String]

Definition Classes
BaseSemanticAnalyzer
def getInputs(): HashSet[ReadEntity]

Definition Classes
BaseSemanticAnalyzer
def getLineageInfo(): LineageInfo

Definition Classes
BaseSemanticAnalyzer
def getMetaData(arg0: QB, arg1: ReadEntity): Unit

Definition Classes
SemanticAnalyzer
Annotations
@throws( ... )
def getMetaData(arg0: QB): Unit

Definition Classes
SemanticAnalyzer
Annotations
@throws( ... )
def getOutputs(): HashSet[WriteEntity]

Definition Classes
BaseSemanticAnalyzer
def getParseContext(): ParseContext

Definition Classes
SemanticAnalyzer
def getQB(): QB

Definition Classes
SemanticAnalyzer
def getQueryProperties(): QueryProperties

Definition Classes
BaseSemanticAnalyzer
def getResultSchema(): List[FieldSchema]

This is used in the driver to get the result schema.

Definition Classes
SharkSemanticAnalyzer → SemanticAnalyzer → BaseSemanticAnalyzer
def getRootTasks(): List[Task[_ <: Serializable]]

Definition Classes
BaseSemanticAnalyzer
def getRowResolver(arg0: Operator[_ <: OperatorDesc]): RowResolver

Definition Classes
SemanticAnalyzer
def getSkewedValueFromASTNode(arg0: ASTNode): List[String]

Attributes
protected[org.apache.hadoop.hive.ql.parse]
Definition Classes
BaseSemanticAnalyzer
def getSkewedValuesFromASTNode(arg0: Node): List[String]

Attributes
protected[org.apache.hadoop.hive.ql.parse]
Definition Classes
BaseSemanticAnalyzer
Annotations
@throws( ... )
def getTableAccessInfo(): TableAccessInfo

Definition Classes
BaseSemanticAnalyzer
def handleGenericFileFormat(arg0: ASTNode): Unit

Attributes
protected[org.apache.hadoop.hive.ql.parse]
Definition Classes
BaseSemanticAnalyzer
Annotations
@throws( ... )
def hashCode(): Int

Definition Classes
AnyRef → Any
def init(): Unit

Definition Classes
SemanticAnalyzer → BaseSemanticAnalyzer
def initCtx(arg0: Context): Unit

Definition Classes
BaseSemanticAnalyzer
def initParseCtx(arg0: ParseContext): Unit

Definition Classes
SemanticAnalyzer
def initPhase1Ctx(): Phase1Ctx

Definition Classes
SemanticAnalyzer
final def isInstanceOf[T0]: Boolean

Definition Classes
Any
def isTraceEnabled(): Boolean

Attributes
protected
Definition Classes
Logging
final def isValidPrefixSpec(arg0: Table, arg1: Map[String, String]): Boolean

Definition Classes
BaseSemanticAnalyzer
Annotations
@throws( ... )
def log: Logger

Attributes
protected
Definition Classes
Logging
def logDebug(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logDebug(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logError(msg: String, exception: Throwable): Unit

Definition Classes
LogHelper
def logError(msg: String, detail: String): Unit

Definition Classes
LogHelper
def logError(msg: ⇒ String): Unit

Definition Classes
LogHelper → Logging
def logError(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logInfo(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logInfo(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logTrace(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logTrace(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logWarning(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logWarning(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
final def ne(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def notify(): Unit

Definition Classes
AnyRef
final def notifyAll(): Unit

Definition Classes
AnyRef
def outStream(): PrintStream

Definition Classes
LogHelper
def processNoScanCommand(arg0: ASTNode): Unit

Attributes
protected[org.apache.hadoop.hive.ql.parse]
Definition Classes
SemanticAnalyzer
Annotations
@throws( ... )
def processPartialScanCommand(arg0: ASTNode): Unit

Attributes
protected[org.apache.hadoop.hive.ql.parse]
Definition Classes
SemanticAnalyzer
Annotations
@throws( ... )
def putOpInsertMap[T <: OperatorDesc](arg0: Operator[T], arg1: RowResolver): Operator[T]

Definition Classes
SemanticAnalyzer
def reset(): Unit

Attributes
protected[org.apache.hadoop.hive.ql.parse]
Definition Classes
SemanticAnalyzer → BaseSemanticAnalyzer
def setColumnAccessInfo(arg0: ColumnAccessInfo): Unit

Definition Classes
BaseSemanticAnalyzer
def setFetchTask(arg0: FetchTask): Unit

Definition Classes
BaseSemanticAnalyzer
def setLineageInfo(arg0: LineageInfo): Unit

Definition Classes
BaseSemanticAnalyzer
def setQB(arg0: QB): Unit

Definition Classes
SemanticAnalyzer
def setTableAccessInfo(arg0: TableAccessInfo): Unit

Definition Classes
BaseSemanticAnalyzer
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes
AnyRef
def toString(): String

Definition Classes
AnyRef → Any
def validate(): Unit

Definition Classes
SemanticAnalyzer → BaseSemanticAnalyzer
Annotations
@throws( ... )
final def wait(): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )

class SharkSemanticAnalyzer extends SemanticAnalyzer with LogHelper

Instance Constructors

new SharkSemanticAnalyzer(conf: HiveConf)

Type Members

class AnalyzeCreateCommonVars extends AnyRef

class RowFormatParams extends AnyRef

class StorageFormat extends AnyRef

Value Members

final def !=(arg0: AnyRef): Boolean

final def !=(arg0: Any): Boolean

final def ##(): Int

final def ==(arg0: AnyRef): Boolean

final def ==(arg0: Any): Boolean

var _resSchema: List[FieldSchema]

def analyze(arg0: ASTNode, arg1: Context): Unit

def analyzeCreateTable(rootAST: ASTNode, queryBlock: QueryBlock): Option[ASTNode]

def analyzeDDLSkewedValues(arg0: List[List[String]], arg1: ASTNode): Unit

def analyzeInternal(ast: ASTNode): Unit

def analyzeSkewedTablDDLColNames(arg0: List[String], arg1: ASTNode): List[String]

def analyzeStoredAdDirs(arg0: ASTNode): Boolean

final def asInstanceOf[T0]: T0

def clone(): AnyRef

def constructListBucketingCtx(arg0: List[String], arg1: List[List[String]], arg2: Map[SkewedValueList, String], arg3: Boolean, arg4: HiveConf): ListBucketingCtx

def doPhase1(arg0: ASTNode, arg1: QB, arg2: Phase1Ctx): Boolean

def doPhase1QBExpr(arg0: ASTNode, arg1: QBExpr, arg2: String, arg3: String): Unit

final def eq(arg0: AnyRef): Boolean

def equals(arg0: Any): Boolean

def errStream(): PrintStream

def extractPartitionSpecs(arg0: Tree): HashMap[String, String]

def finalize(): Unit

def genAllExprNodeDesc(arg0: ASTNode, arg1: RowResolver, arg2: TypeCheckCtx): Map[ASTNode, ExprNodeDesc]

def genAllExprNodeDesc(arg0: ASTNode, arg1: RowResolver): Map[ASTNode, ExprNodeDesc]

def genExprNodeDesc(arg0: ASTNode, arg1: RowResolver, arg2: TypeCheckCtx): ExprNodeDesc

def genExprNodeDesc(arg0: ASTNode, arg1: RowResolver): ExprNodeDesc

def genMapRedTasks(qb: QueryBlock, pctx: ParseContext, terminalOps: Seq[TerminalOperator]): Unit

def genPlan(arg0: QB): Operator[_ <: OperatorDesc]

final def getClass(): Class[_]

def getColumnAccessInfo(): ColumnAccessInfo

def getColumnNames(arg0: ASTNode): List[String]

def getColumnNamesOrder(arg0: ASTNode): List[Order]

def getColumns(arg0: ASTNode): List[FieldSchema]

def getDb(): Hive

def getFetchTask(): FetchTask

def getIdToTableNameMap(): HashMap[String, String]

def getInputs(): HashSet[ReadEntity]

def getLineageInfo(): LineageInfo

def getMetaData(arg0: QB, arg1: ReadEntity): Unit

def getMetaData(arg0: QB): Unit

def getOutputs(): HashSet[WriteEntity]

def getParseContext(): ParseContext

def getQB(): QB

def getQueryProperties(): QueryProperties

def getResultSchema(): List[FieldSchema]

def getRootTasks(): List[Task[_ <: Serializable]]

def getRowResolver(arg0: Operator[_ <: OperatorDesc]): RowResolver

def getSkewedValueFromASTNode(arg0: ASTNode): List[String]

def getSkewedValuesFromASTNode(arg0: Node): List[String]

def getTableAccessInfo(): TableAccessInfo

def handleGenericFileFormat(arg0: ASTNode): Unit

def hashCode(): Int

def init(): Unit

def initCtx(arg0: Context): Unit

def initParseCtx(arg0: ParseContext): Unit

def initPhase1Ctx(): Phase1Ctx

final def isInstanceOf[T0]: Boolean

def isTraceEnabled(): Boolean

final def isValidPrefixSpec(arg0: Table, arg1: Map[String, String]): Boolean

def log: Logger

def logDebug(msg: ⇒ String, throwable: Throwable): Unit

def logDebug(msg: ⇒ String): Unit

def logError(msg: String, exception: Throwable): Unit

def logError(msg: String, detail: String): Unit

def logError(msg: ⇒ String): Unit

def logError(msg: ⇒ String, throwable: Throwable): Unit

def logInfo(msg: ⇒ String, throwable: Throwable): Unit

def logInfo(msg: ⇒ String): Unit

def logTrace(msg: ⇒ String, throwable: Throwable): Unit

def logTrace(msg: ⇒ String): Unit

def logWarning(msg: ⇒ String, throwable: Throwable): Unit