1 PREHOOK: query: create table student_2_lines(
6 fields terminated by '\001'
8 PREHOOK: type: CREATETABLE
9 PREHOOK: Output: database:default
10 PREHOOK: Output: default@student_2_lines
11 POSTHOOK: query: create table student_2_lines(
16 fields terminated by '\001'
18 POSTHOOK: type: CREATETABLE
19 POSTHOOK: Output: database:default
20 POSTHOOK: Output: default@student_2_lines
21 PREHOOK: query: LOAD DATA LOCAL INPATH '../../data/files/student_2_lines' OVERWRITE INTO TABLE student_2_lines
23 #### A masked pattern was here ####
24 PREHOOK: Output: default@student_2_lines
25 POSTHOOK: query: LOAD DATA LOCAL INPATH '../../data/files/student_2_lines' OVERWRITE INTO TABLE student_2_lines
27 #### A masked pattern was here ####
28 POSTHOOK: Output: default@student_2_lines
29 PREHOOK: query: analyze table student_2_lines compute statistics
31 PREHOOK: Input: default@student_2_lines
32 PREHOOK: Output: default@student_2_lines
33 POSTHOOK: query: analyze table student_2_lines compute statistics
35 POSTHOOK: Input: default@student_2_lines
36 POSTHOOK: Output: default@student_2_lines
37 PREHOOK: query: create table insert_10_1 (a float, b int, c timestamp, d binary)
38 PREHOOK: type: CREATETABLE
39 PREHOOK: Output: database:default
40 PREHOOK: Output: default@insert_10_1
41 POSTHOOK: query: create table insert_10_1 (a float, b int, c timestamp, d binary)
42 POSTHOOK: type: CREATETABLE
43 POSTHOOK: Output: database:default
44 POSTHOOK: Output: default@insert_10_1
45 PREHOOK: query: explain vectorization detail
46 insert overwrite table insert_10_1
47 select cast(gpa as float),
49 IF(age>40,cast('2011-01-01 01:01:01' as timestamp),NULL),
50 IF(LENGTH(name)>10,cast(name as binary),NULL) from student_2_lines
52 POSTHOOK: query: explain vectorization detail
53 insert overwrite table insert_10_1
54 select cast(gpa as float),
56 IF(age>40,cast('2011-01-01 01:01:01' as timestamp),NULL),
57 IF(LENGTH(name)>10,cast(name as binary),NULL) from student_2_lines
61 enabledConditionsMet: [hive.vectorized.execution.enabled IS true]
64 Stage-1 is a root stage
65 Stage-2 depends on stages: Stage-1
66 Stage-0 depends on stages: Stage-2
67 Stage-3 depends on stages: Stage-0
72 #### A masked pattern was here ####
77 alias: student_2_lines
78 Statistics: Num rows: 2 Data size: 392 Basic stats: COMPLETE Column stats: NONE
79 TableScan Vectorization:
81 vectorizationSchemaColumns: [0:name:string, 1:age:int, 2:gpa:double, 3:ROW__ID:struct<transactionid:bigint,bucketid:int,rowid:bigint>]
83 expressions: UDFToFloat(gpa) (type: float), age (type: int), if((age > 40), TIMESTAMP'2011-01-01 01:01:01.0', null) (type: timestamp), if((length(name) > 10), CAST( name AS BINARY), null) (type: binary)
84 outputColumnNames: _col0, _col1, _col2, _col3
86 className: VectorSelectOperator
88 projectedOutputColumnNums: [2, 1, 5, 8]
89 selectExpressions: VectorUDFAdaptor(if((age > 40), TIMESTAMP'2011-01-01 01:01:01.0', null))(children: LongColGreaterLongScalar(col 1:int, val 40) -> 4:boolean) -> 5:timestamp, VectorUDFAdaptor(if((length(name) > 10), CAST( name AS BINARY), null))(children: LongColGreaterLongScalar(col 4:int, val 10)(children: StringLength(col 0:string) -> 4:int) -> 6:boolean, VectorUDFAdaptor(CAST( name AS BINARY)) -> 7:binary) -> 8:binary
90 Statistics: Num rows: 2 Data size: 392 Basic stats: COMPLETE Column stats: NONE
93 File Sink Vectorization:
94 className: VectorFileSinkOperator
96 Statistics: Num rows: 2 Data size: 392 Basic stats: COMPLETE Column stats: NONE
98 input format: org.apache.hadoop.mapred.TextInputFormat
99 output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
100 serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
101 name: default.insert_10_1
102 Execution mode: vectorized, llap
106 enabledConditionsMet: hive.vectorized.use.vector.serde.deserialize IS true
107 inputFormatFeatureSupport: [DECIMAL_64]
108 vectorizationSupportRemovedReasons: [DECIMAL_64 disabled because LLAP is enabled]
109 featureSupportInUse: []
110 inputFileFormats: org.apache.hadoop.mapred.TextInputFormat
112 usesVectorUDFAdaptor: true
116 includeColumns: [0, 1, 2]
117 dataColumns: name:string, age:int, gpa:double
118 partitionColumnCount: 0
119 scratchColumnTypeNames: [bigint, timestamp, bigint, string, string]
122 Dependency Collection
129 input format: org.apache.hadoop.mapred.TextInputFormat
130 output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
131 serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
132 name: default.insert_10_1
138 PREHOOK: query: insert overwrite table insert_10_1
139 select cast(gpa as float),
141 IF(age>40,cast('2011-01-01 01:01:01' as timestamp),NULL),
142 IF(LENGTH(name)>10,cast(name as binary),NULL) from student_2_lines
144 PREHOOK: Input: default@student_2_lines
145 PREHOOK: Output: default@insert_10_1
146 POSTHOOK: query: insert overwrite table insert_10_1
147 select cast(gpa as float),
149 IF(age>40,cast('2011-01-01 01:01:01' as timestamp),NULL),
150 IF(LENGTH(name)>10,cast(name as binary),NULL) from student_2_lines
151 POSTHOOK: type: QUERY
152 POSTHOOK: Input: default@student_2_lines
153 POSTHOOK: Output: default@insert_10_1
154 POSTHOOK: Lineage: insert_10_1.a EXPRESSION [(student_2_lines)student_2_lines.FieldSchema(name:gpa, type:double, comment:null), ]
155 POSTHOOK: Lineage: insert_10_1.b SIMPLE [(student_2_lines)student_2_lines.FieldSchema(name:age, type:int, comment:null), ]
156 POSTHOOK: Lineage: insert_10_1.c EXPRESSION [(student_2_lines)student_2_lines.FieldSchema(name:age, type:int, comment:null), ]
157 POSTHOOK: Lineage: insert_10_1.d EXPRESSION [(student_2_lines)student_2_lines.FieldSchema(name:name, type:string, comment:null), ]