PageRenderTime 51ms CodeModel.GetById 17ms app.highlight 17ms RepoModel.GetById 2ms app.codeStats 1ms

/tags/release-0.2.0-rc0/hive/external/ql/src/test/results/clientpositive/bucketmapjoin4.q.out

#
text | 1013 lines | 989 code | 24 blank | 0 comment | 0 complexity | 570d96aceb6cb4a11e968199a42b5df6 MD5 | raw file

Large files are truncated, but you can click here to view the full file

  1PREHOOK: query: CREATE TABLE srcbucket_mapjoin(key int, value string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  2PREHOOK: type: CREATETABLE
  3POSTHOOK: query: CREATE TABLE srcbucket_mapjoin(key int, value string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  4POSTHOOK: type: CREATETABLE
  5POSTHOOK: Output: default@srcbucket_mapjoin
  6PREHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin
  7PREHOOK: type: LOAD
  8PREHOOK: Output: default@srcbucket_mapjoin
  9POSTHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin
 10POSTHOOK: type: LOAD
 11POSTHOOK: Output: default@srcbucket_mapjoin
 12PREHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin
 13PREHOOK: type: LOAD
 14PREHOOK: Output: default@srcbucket_mapjoin
 15POSTHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin
 16POSTHOOK: type: LOAD
 17POSTHOOK: Output: default@srcbucket_mapjoin
 18PREHOOK: query: CREATE TABLE srcbucket_mapjoin_part (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 4 BUCKETS STORED AS TEXTFILE
 19PREHOOK: type: CREATETABLE
 20POSTHOOK: query: CREATE TABLE srcbucket_mapjoin_part (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 4 BUCKETS STORED AS TEXTFILE
 21POSTHOOK: type: CREATETABLE
 22POSTHOOK: Output: default@srcbucket_mapjoin_part
 23PREHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 24PREHOOK: type: LOAD
 25PREHOOK: Output: default@srcbucket_mapjoin_part
 26POSTHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 27POSTHOOK: type: LOAD
 28POSTHOOK: Output: default@srcbucket_mapjoin_part
 29POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
 30PREHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 31PREHOOK: type: LOAD
 32PREHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
 33POSTHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 34POSTHOOK: type: LOAD
 35POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
 36PREHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 37PREHOOK: type: LOAD
 38PREHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
 39POSTHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 40POSTHOOK: type: LOAD
 41POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
 42PREHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 43PREHOOK: type: LOAD
 44PREHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
 45POSTHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 46POSTHOOK: type: LOAD
 47POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
 48PREHOOK: query: CREATE TABLE srcbucket_mapjoin_part_2 (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
 49PREHOOK: type: CREATETABLE
 50POSTHOOK: query: CREATE TABLE srcbucket_mapjoin_part_2 (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
 51POSTHOOK: type: CREATETABLE
 52POSTHOOK: Output: default@srcbucket_mapjoin_part_2
 53PREHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
 54PREHOOK: type: LOAD
 55PREHOOK: Output: default@srcbucket_mapjoin_part_2
 56POSTHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
 57POSTHOOK: type: LOAD
 58POSTHOOK: Output: default@srcbucket_mapjoin_part_2
 59POSTHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
 60PREHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
 61PREHOOK: type: LOAD
 62PREHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
 63POSTHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
 64POSTHOOK: type: LOAD
 65POSTHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
 66PREHOOK: query: create table bucketmapjoin_hash_result_1 (key bigint , value1 bigint, value2 bigint)
 67PREHOOK: type: CREATETABLE
 68POSTHOOK: query: create table bucketmapjoin_hash_result_1 (key bigint , value1 bigint, value2 bigint)
 69POSTHOOK: type: CREATETABLE
 70POSTHOOK: Output: default@bucketmapjoin_hash_result_1
 71PREHOOK: query: create table bucketmapjoin_hash_result_2 (key bigint , value1 bigint, value2 bigint)
 72PREHOOK: type: CREATETABLE
 73POSTHOOK: query: create table bucketmapjoin_hash_result_2 (key bigint , value1 bigint, value2 bigint)
 74POSTHOOK: type: CREATETABLE
 75POSTHOOK: Output: default@bucketmapjoin_hash_result_2
 76PREHOOK: query: create table bucketmapjoin_tmp_result (key string , value1 string, value2 string)
 77PREHOOK: type: CREATETABLE
 78POSTHOOK: query: create table bucketmapjoin_tmp_result (key string , value1 string, value2 string)
 79POSTHOOK: type: CREATETABLE
 80POSTHOOK: Output: default@bucketmapjoin_tmp_result
 81PREHOOK: query: explain extended
 82insert overwrite table bucketmapjoin_tmp_result
 83select /*+mapjoin(b)*/ a.key, a.value, b.value
 84from srcbucket_mapjoin a join srcbucket_mapjoin b
 85on a.key=b.key
 86PREHOOK: type: QUERY
 87POSTHOOK: query: explain extended
 88insert overwrite table bucketmapjoin_tmp_result
 89select /*+mapjoin(b)*/ a.key, a.value, b.value
 90from srcbucket_mapjoin a join srcbucket_mapjoin b
 91on a.key=b.key
 92POSTHOOK: type: QUERY
 93ABSTRACT SYNTAX TREE:
 94  (TOK_QUERY (TOK_FROM (TOK_JOIN (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin) a) (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin) b) (= (. (TOK_TABLE_OR_COL a) key) (. (TOK_TABLE_OR_COL b) key)))) (TOK_INSERT (TOK_DESTINATION (TOK_TAB (TOK_TABNAME bucketmapjoin_tmp_result))) (TOK_SELECT (TOK_HINTLIST (TOK_HINT TOK_MAPJOIN (TOK_HINTARGLIST b))) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) key)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) value)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL b) value)))))
 95
 96STAGE DEPENDENCIES:
 97  Stage-7 is a root stage
 98  Stage-1 depends on stages: Stage-7
 99  Stage-5 depends on stages: Stage-1 , consists of Stage-4, Stage-3
100  Stage-4
101  Stage-0 depends on stages: Stage-4, Stage-3
102  Stage-2 depends on stages: Stage-0
103  Stage-3
104
105STAGE PLANS:
106  Stage: Stage-7
107    Map Reduce Local Work
108      Alias -> Map Local Tables:
109        b 
110          Fetch Operator
111            limit: -1
112      Alias -> Map Local Operator Tree:
113        b 
114          TableScan
115            alias: b
116            GatherStats: false
117            HashTable Sink Operator
118              condition expressions:
119                0 {key} {value}
120                1 {value}
121              handleSkewJoin: false
122              keys:
123                0 [Column[key]]
124                1 [Column[key]]
125              Position of Big Table: 0
126      Bucket Mapjoin Context:
127          Alias Bucket Base File Name Mapping:
128            b {srcbucket20.txt=[srcbucket20.txt], srcbucket21.txt=[srcbucket21.txt]}
129          Alias Bucket File Name Mapping:
130            b {pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt], pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt]}
131          Alias Bucket Output File Name Mapping:
132            pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt 0
133            pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt 1
134
135  Stage: Stage-1
136    Map Reduce
137      Alias -> Map Operator Tree:
138        a 
139          TableScan
140            alias: a
141            GatherStats: false
142            Map Join Operator
143              condition map:
144                   Inner Join 0 to 1
145              condition expressions:
146                0 {key} {value}
147                1 {value}
148              handleSkewJoin: false
149              keys:
150                0 [Column[key]]
151                1 [Column[key]]
152              outputColumnNames: _col0, _col1, _col5
153              Position of Big Table: 0
154              Select Operator
155                expressions:
156                      expr: _col0
157                      type: int
158                      expr: _col1
159                      type: string
160                      expr: _col5
161                      type: string
162                outputColumnNames: _col0, _col1, _col5
163                Select Operator
164                  expressions:
165                        expr: _col0
166                        type: int
167                        expr: _col1
168                        type: string
169                        expr: _col5
170                        type: string
171                  outputColumnNames: _col0, _col1, _col2
172                  File Output Operator
173                    compressed: false
174                    GlobalTableId: 1
175                    directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10002
176                    NumFilesPerFileSink: 1
177                    Stats Publishing Key Prefix: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10000/
178                    table:
179                        input format: org.apache.hadoop.mapred.TextInputFormat
180                        output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
181                        properties:
182                          bucket_count -1
183                          columns key,value1,value2
184                          columns.types string:string:string
185                          file.inputformat org.apache.hadoop.mapred.TextInputFormat
186                          file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
187                          location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
188                          name default.bucketmapjoin_tmp_result
189                          serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
190                          serialization.format 1
191                          serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
192                          transient_lastDdlTime 1306979244
193                        serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
194                        name: default.bucketmapjoin_tmp_result
195                    TotalFiles: 1
196                    GatherStats: true
197                    MultiFileSpray: false
198      Local Work:
199        Map Reduce Local Work
200      Needs Tagging: false
201      Path -> Alias:
202        pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin [a]
203      Path -> Partition:
204        pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin 
205          Partition
206            base file name: srcbucket_mapjoin
207            input format: org.apache.hadoop.mapred.TextInputFormat
208            output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
209            properties:
210              bucket_count 2
211              bucket_field_name key
212              columns key,value
213              columns.types int:string
214              file.inputformat org.apache.hadoop.mapred.TextInputFormat
215              file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
216              location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin
217              name default.srcbucket_mapjoin
218              serialization.ddl struct srcbucket_mapjoin { i32 key, string value}
219              serialization.format 1
220              serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
221              transient_lastDdlTime 1306979239
222            serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
223          
224              input format: org.apache.hadoop.mapred.TextInputFormat
225              output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
226              properties:
227                bucket_count 2
228                bucket_field_name key
229                columns key,value
230                columns.types int:string
231                file.inputformat org.apache.hadoop.mapred.TextInputFormat
232                file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
233                location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin
234                name default.srcbucket_mapjoin
235                serialization.ddl struct srcbucket_mapjoin { i32 key, string value}
236                serialization.format 1
237                serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
238                transient_lastDdlTime 1306979239
239              serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
240              name: default.srcbucket_mapjoin
241            name: default.srcbucket_mapjoin
242
243  Stage: Stage-5
244    Conditional Operator
245
246  Stage: Stage-4
247    Move Operator
248      files:
249          hdfs directory: true
250          source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10002
251          destination: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10000
252
253  Stage: Stage-0
254    Move Operator
255      tables:
256          replace: true
257          source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10000
258          table:
259              input format: org.apache.hadoop.mapred.TextInputFormat
260              output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
261              properties:
262                bucket_count -1
263                columns key,value1,value2
264                columns.types string:string:string
265                file.inputformat org.apache.hadoop.mapred.TextInputFormat
266                file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
267                location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
268                name default.bucketmapjoin_tmp_result
269                serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
270                serialization.format 1
271                serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
272                transient_lastDdlTime 1306979244
273              serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
274              name: default.bucketmapjoin_tmp_result
275          tmp directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10001
276
277  Stage: Stage-2
278    Stats-Aggr Operator
279      Stats Aggregation Key Prefix: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10000/
280
281  Stage: Stage-3
282    Map Reduce
283      Alias -> Map Operator Tree:
284        pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10002 
285            File Output Operator
286              compressed: false
287              GlobalTableId: 0
288              directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10000
289              NumFilesPerFileSink: 1
290              table:
291                  input format: org.apache.hadoop.mapred.TextInputFormat
292                  output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
293                  properties:
294                    bucket_count -1
295                    columns key,value1,value2
296                    columns.types string:string:string
297                    file.inputformat org.apache.hadoop.mapred.TextInputFormat
298                    file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
299                    location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
300                    name default.bucketmapjoin_tmp_result
301                    serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
302                    serialization.format 1
303                    serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
304                    transient_lastDdlTime 1306979244
305                  serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
306                  name: default.bucketmapjoin_tmp_result
307              TotalFiles: 1
308              GatherStats: false
309              MultiFileSpray: false
310      Needs Tagging: false
311      Path -> Alias:
312        pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10002 [pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10002]
313      Path -> Partition:
314        pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10002 
315          Partition
316            base file name: -ext-10002
317            input format: org.apache.hadoop.mapred.TextInputFormat
318            output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
319            properties:
320              bucket_count -1
321              columns key,value1,value2
322              columns.types string:string:string
323              file.inputformat org.apache.hadoop.mapred.TextInputFormat
324              file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
325              location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
326              name default.bucketmapjoin_tmp_result
327              serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
328              serialization.format 1
329              serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
330              transient_lastDdlTime 1306979244
331            serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
332          
333              input format: org.apache.hadoop.mapred.TextInputFormat
334              output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
335              properties:
336                bucket_count -1
337                columns key,value1,value2
338                columns.types string:string:string
339                file.inputformat org.apache.hadoop.mapred.TextInputFormat
340                file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
341                location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
342                name default.bucketmapjoin_tmp_result
343                serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
344                serialization.format 1
345                serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
346                transient_lastDdlTime 1306979244
347              serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
348              name: default.bucketmapjoin_tmp_result
349            name: default.bucketmapjoin_tmp_result
350
351
352PREHOOK: query: insert overwrite table bucketmapjoin_tmp_result
353select /*+mapjoin(b)*/ a.key, a.value, b.value
354from srcbucket_mapjoin a join srcbucket_mapjoin b
355on a.key=b.key
356PREHOOK: type: QUERY
357PREHOOK: Input: default@srcbucket_mapjoin
358PREHOOK: Output: default@bucketmapjoin_tmp_result
359POSTHOOK: query: insert overwrite table bucketmapjoin_tmp_result
360select /*+mapjoin(b)*/ a.key, a.value, b.value
361from srcbucket_mapjoin a join srcbucket_mapjoin b
362on a.key=b.key
363POSTHOOK: type: QUERY
364POSTHOOK: Input: default@srcbucket_mapjoin
365POSTHOOK: Output: default@bucketmapjoin_tmp_result
366POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
367POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
368POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
369PREHOOK: query: select count(1) from bucketmapjoin_tmp_result
370PREHOOK: type: QUERY
371PREHOOK: Input: default@bucketmapjoin_tmp_result
372PREHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-47-33_354_3111033757385788525/-mr-10000
373POSTHOOK: query: select count(1) from bucketmapjoin_tmp_result
374POSTHOOK: type: QUERY
375POSTHOOK: Input: default@bucketmapjoin_tmp_result
376POSTHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-47-33_354_3111033757385788525/-mr-10000
377POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
378POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
379POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
380464
381PREHOOK: query: insert overwrite table bucketmapjoin_hash_result_1
382select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
383PREHOOK: type: QUERY
384PREHOOK: Input: default@bucketmapjoin_tmp_result
385PREHOOK: Output: default@bucketmapjoin_hash_result_1
386POSTHOOK: query: insert overwrite table bucketmapjoin_hash_result_1
387select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
388POSTHOOK: type: QUERY
389POSTHOOK: Input: default@bucketmapjoin_tmp_result
390POSTHOOK: Output: default@bucketmapjoin_hash_result_1
391POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
392POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
393POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
394POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
395POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
396POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
397PREHOOK: query: insert overwrite table bucketmapjoin_tmp_result
398select /*+mapjoin(b)*/ a.key, a.value, b.value
399from srcbucket_mapjoin a join srcbucket_mapjoin b
400on a.key=b.key
401PREHOOK: type: QUERY
402PREHOOK: Input: default@srcbucket_mapjoin
403PREHOOK: Output: default@bucketmapjoin_tmp_result
404POSTHOOK: query: insert overwrite table bucketmapjoin_tmp_result
405select /*+mapjoin(b)*/ a.key, a.value, b.value
406from srcbucket_mapjoin a join srcbucket_mapjoin b
407on a.key=b.key
408POSTHOOK: type: QUERY
409POSTHOOK: Input: default@srcbucket_mapjoin
410POSTHOOK: Output: default@bucketmapjoin_tmp_result
411POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
412POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
413POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
414POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
415POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
416POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
417POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
418POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
419POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
420PREHOOK: query: select count(1) from bucketmapjoin_tmp_result
421PREHOOK: type: QUERY
422PREHOOK: Input: default@bucketmapjoin_tmp_result
423PREHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-47-49_331_2976822432880371649/-mr-10000
424POSTHOOK: query: select count(1) from bucketmapjoin_tmp_result
425POSTHOOK: type: QUERY
426POSTHOOK: Input: default@bucketmapjoin_tmp_result
427POSTHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-47-49_331_2976822432880371649/-mr-10000
428POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
429POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
430POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
431POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
432POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
433POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
434POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
435POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
436POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
437464
438PREHOOK: query: insert overwrite table bucketmapjoin_hash_result_2
439select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
440PREHOOK: type: QUERY
441PREHOOK: Input: default@bucketmapjoin_tmp_result
442PREHOOK: Output: default@bucketmapjoin_hash_result_2
443POSTHOOK: query: insert overwrite table bucketmapjoin_hash_result_2
444select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
445POSTHOOK: type: QUERY
446POSTHOOK: Input: default@bucketmapjoin_tmp_result
447POSTHOOK: Output: default@bucketmapjoin_hash_result_2
448POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
449POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
450POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
451POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
452POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
453POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
454POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
455POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
456POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
457POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
458POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
459POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
460PREHOOK: query: select a.key-b.key, a.value1-b.value1, a.value2-b.value2
461from bucketmapjoin_hash_result_1 a left outer join bucketmapjoin_hash_result_2 b
462on a.key = b.key
463PREHOOK: type: QUERY
464PREHOOK: Input: default@bucketmapjoin_hash_result_1
465PREHOOK: Input: default@bucketmapjoin_hash_result_2
466PREHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-47-56_317_7787039686001016086/-mr-10000
467POSTHOOK: query: select a.key-b.key, a.value1-b.value1, a.value2-b.value2
468from bucketmapjoin_hash_result_1 a left outer join bucketmapjoin_hash_result_2 b
469on a.key = b.key
470POSTHOOK: type: QUERY
471POSTHOOK: Input: default@bucketmapjoin_hash_result_1
472POSTHOOK: Input: default@bucketmapjoin_hash_result_2
473POSTHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-47-56_317_7787039686001016086/-mr-10000
474POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
475POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
476POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
477POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
478POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
479POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
480POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
481POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
482POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
483POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
484POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
485POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
4860	0	0
487PREHOOK: query: explain extended
488insert overwrite table bucketmapjoin_tmp_result
489select /*+mapjoin(a)*/ a.key, a.value, b.value
490from srcbucket_mapjoin a join srcbucket_mapjoin b
491on a.key=b.key
492PREHOOK: type: QUERY
493POSTHOOK: query: explain extended
494insert overwrite table bucketmapjoin_tmp_result
495select /*+mapjoin(a)*/ a.key, a.value, b.value
496from srcbucket_mapjoin a join srcbucket_mapjoin b
497on a.key=b.key
498POSTHOOK: type: QUERY
499POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
500POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
501POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
502POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
503POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
504POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
505POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
506POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
507POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
508POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
509POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
510POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
511ABSTRACT SYNTAX TREE:
512  (TOK_QUERY (TOK_FROM (TOK_JOIN (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin) a) (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin) b) (= (. (TOK_TABLE_OR_COL a) key) (. (TOK_TABLE_OR_COL b) key)))) (TOK_INSERT (TOK_DESTINATION (TOK_TAB (TOK_TABNAME bucketmapjoin_tmp_result))) (TOK_SELECT (TOK_HINTLIST (TOK_HINT TOK_MAPJOIN (TOK_HINTARGLIST a))) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) key)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) value)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL b) value)))))
513
514STAGE DEPENDENCIES:
515  Stage-7 is a root stage
516  Stage-1 depends on stages: Stage-7
517  Stage-5 depends on stages: Stage-1 , consists of Stage-4, Stage-3
518  Stage-4
519  Stage-0 depends on stages: Stage-4, Stage-3
520  Stage-2 depends on stages: Stage-0
521  Stage-3
522
523STAGE PLANS:
524  Stage: Stage-7
525    Map Reduce Local Work
526      Alias -> Map Local Tables:
527        a 
528          Fetch Operator
529            limit: -1
530      Alias -> Map Local Operator Tree:
531        a 
532          TableScan
533            alias: a
534            GatherStats: false
535            HashTable Sink Operator
536              condition expressions:
537                0 {key} {value}
538                1 {value}
539              handleSkewJoin: false
540              keys:
541                0 [Column[key]]
542                1 [Column[key]]
543              Position of Big Table: 1
544      Bucket Mapjoin Context:
545          Alias Bucket Base File Name Mapping:
546            a {srcbucket20.txt=[srcbucket20.txt], srcbucket21.txt=[srcbucket21.txt]}
547          Alias Bucket File Name Mapping:
548            a {pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt], pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt]}
549          Alias Bucket Output File Name Mapping:
550            pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt 0
551            pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt 1
552
553  Stage: Stage-1
554    Map Reduce
555      Alias -> Map Operator Tree:
556        b 
557          TableScan
558            alias: b
559            GatherStats: false
560            Map Join Operator
561              condition map:
562                   Inner Join 0 to 1
563              condition expressions:
564                0 {key} {value}
565                1 {value}
566              handleSkewJoin: false
567              keys:
568                0 [Column[key]]
569                1 [Column[key]]
570              outputColumnNames: _col0, _col1, _col5
571              Position of Big Table: 1
572              Select Operator
573                expressions:
574                      expr: _col0
575                      type: int
576                      expr: _col1
577                      type: string
578                      expr: _col5
579                      type: string
580                outputColumnNames: _col0, _col1, _col5
581                Select Operator
582                  expressions:
583                        expr: _col0
584                        type: int
585                        expr: _col1
586                        type: string
587                        expr: _col5
588                        type: string
589                  outputColumnNames: _col0, _col1, _col2
590                  File Output Operator
591                    compressed: false
592                    GlobalTableId: 1
593                    directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10002
594                    NumFilesPerFileSink: 1
595                    Stats Publishing Key Prefix: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10000/
596                    table:
597                        input format: org.apache.hadoop.mapred.TextInputFormat
598                        output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
599                        properties:
600                          bucket_count -1
601                          columns key,value1,value2
602                          columns.types string:string:string
603                          file.inputformat org.apache.hadoop.mapred.TextInputFormat
604                          file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
605                          location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
606                          name default.bucketmapjoin_tmp_result
607                          numFiles 1
608                          numPartitions 0
609                          numRows 464
610                          rawDataSize 8519
611                          serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
612                          serialization.format 1
613                          serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
614                          totalSize 8983
615                          transient_lastDdlTime 1306979269
616                        serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
617                        name: default.bucketmapjoin_tmp_result
618                    TotalFiles: 1
619                    GatherStats: true
620                    MultiFileSpray: false
621      Local Work:
622        Map Reduce Local Work
623      Needs Tagging: false
624      Path -> Alias:
625        pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin [b]
626      Path -> Partition:
627        pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin 
628          Partition
629            base file name: srcbucket_mapjoin
630            input format: org.apache.hadoop.mapred.TextInputFormat
631            output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
632            properties:
633              bucket_count 2
634              bucket_field_name key
635              columns key,value
636              columns.types int:string
637              file.inputformat org.apache.hadoop.mapred.TextInputFormat
638              file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
639              location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin
640              name default.srcbucket_mapjoin
641              serialization.ddl struct srcbucket_mapjoin { i32 key, string value}
642              serialization.format 1
643              serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
644              transient_lastDdlTime 1306979239
645            serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
646          
647              input format: org.apache.hadoop.mapred.TextInputFormat
648              output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
649              properties:
650                bucket_count 2
651                bucket_field_name key
652                columns key,value
653                columns.types int:string
654                file.inputformat org.apache.hadoop.mapred.TextInputFormat
655                file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
656                location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin
657                name default.srcbucket_mapjoin
658                serialization.ddl struct srcbucket_mapjoin { i32 key, string value}
659                serialization.format 1
660                serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
661                transient_lastDdlTime 1306979239
662              serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
663              name: default.srcbucket_mapjoin
664            name: default.srcbucket_mapjoin
665
666  Stage: Stage-5
667    Conditional Operator
668
669  Stage: Stage-4
670    Move Operator
671      files:
672          hdfs directory: true
673          source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10002
674          destination: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10000
675
676  Stage: Stage-0
677    Move Operator
678      tables:
679          replace: true
680          source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10000
681          table:
682              input format: org.apache.hadoop.mapred.TextInputFormat
683              output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
684              properties:
685                bucket_count -1
686                columns key,value1,value2
687                columns.types string:string:string
688                file.inputformat org.apache.hadoop.mapred.TextInputFormat
689                file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
690                location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
691                name default.bucketmapjoin_tmp_result
692                numFiles 1
693                numPartitions 0
694                numRows 464
695                rawDataSize 8519
696                serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
697                serialization.format 1
698                serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
699                totalSize 8983
700                transient_lastDdlTime 1306979269
701              serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
702              name: default.bucketmapjoin_tmp_result
703          tmp directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10001
704
705  Stage: Stage-2
706    Stats-Aggr Operator
707      Stats Aggregation Key Prefix: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10000/
708
709  Stage: Stage-3
710    Map Reduce
711      Alias -> Map Operator Tree:
712        pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10002 
713            File Output Operator
714              compressed: false
715              GlobalTableId: 0
716              directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10000
717              NumFilesPerFileSink: 1
718              table:
719                  input format: org.apache.hadoop.mapred.TextInputFormat
720                  output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
721                  properties:
722                    bucket_count -1
723                    columns key,value1,value2
724                    columns.types string:string:string
725                    file.inputformat org.apache.hadoop.mapred.TextInputFormat
726                    file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
727                    location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
728                    name default.bucketmapjoin_tmp_result
729                    numFiles 1
730                    numPartitions 0
731                    numRows 464
732                    rawDataSize 8519
733                    serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
734                    serialization.format 1
735                    serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
736                    totalSize 8983
737                    transient_lastDdlTime 1306979269
738                  serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
739                  name: default.bucketmapjoin_tmp_result
740              TotalFiles: 1
741              GatherStats: false
742              MultiFileSpray: false
743      Needs Tagging: false
744      Path -> Alias:
745        pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10002 [pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10002]
746      Path -> Partition:
747        pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10002 
748          Partition
749            base file name: -ext-10002
750            input format: org.apache.hadoop.mapred.TextInputFormat
751            output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
752            properties:
753              bucket_count -1
754              columns key,value1,value2
755              columns.types string:string:string
756              file.inputformat org.apache.hadoop.mapred.TextInputFormat
757              file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
758              location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
759              name default.bucketmapjoin_tmp_result
760              numFiles 1
761              numPartitions 0
762              numRows 464
763              rawDataSize 8519
764              serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
765              serialization.format 1
766              serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
767              totalSize 8983
768              transient_lastDdlTime 1306979269
769            serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
770          
771              input format: org.apache.hadoop.mapred.TextInputFormat
772              output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
773              properties:
774                bucket_count -1
775                columns key,value1,value2
776                columns.types string:string:string
777                file.inputformat org.apache.hadoop.mapred.TextInputFormat
778                file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
779                location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
780                name default.bucketmapjoin_tmp_result
781                numFiles 1
782                numPartitions 0
783                numRows 464
784                rawDataSize 8519
785                serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
786                serialization.format 1
787                serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
788                totalSize 8983
789                transient_lastDdlTime 1306979269
790              serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
791              name: default.bucketmapjoin_tmp_result
792            name: default.bucketmapjoin_tmp_result
793
794
795PREHOOK: query: insert overwrite table bucketmapjoin_tmp_result
796select /*+mapjoin(a)*/ a.key, a.value, b.value
797from srcbucket_mapjoin a join srcbucket_mapjoin b
798on a.key=b.key
799PREHOOK: type: QUERY
800PREHOOK: Input: default@srcbucket_mapjoin
801PREHOOK: Output: default@bucketmapjoin_tmp_result
802POSTHOOK: query: insert overwrite table bucketmapjoin_tmp_result
803select /*+mapjoin(a)*/ a.key, a.value, b.value
804from srcbucket_mapjoin a join srcbucket_mapjoin b
805on a.key=b.key
806POSTHOOK: type: QUERY
807POSTHOOK: Input: default@srcbucket_mapjoin
808POSTHOOK: Output: default@bucketmapjoin_tmp_result
809POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
810POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
811POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
812POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null…

Large files files are truncated, but you can click here to view the full file