PageRenderTime 32ms CodeModel.GetById 19ms app.highlight 7ms RepoModel.GetById 1ms app.codeStats 1ms

/tags/release-0.2.0-rc0/hive/external/ql/src/test/results/clientpositive/bucketmapjoin3.q.out

#
text | 1031 lines | 1007 code | 24 blank | 0 comment | 0 complexity | f51fdcb56bf6cbad98bc2dd47d4c0869 MD5 | raw file

Large files files are truncated, but you can click here to view the full file

  1PREHOOK: query: CREATE TABLE srcbucket_mapjoin(key int, value string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  2PREHOOK: type: CREATETABLE
  3POSTHOOK: query: CREATE TABLE srcbucket_mapjoin(key int, value string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  4POSTHOOK: type: CREATETABLE
  5POSTHOOK: Output: default@srcbucket_mapjoin
  6PREHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin
  7PREHOOK: type: LOAD
  8PREHOOK: Output: default@srcbucket_mapjoin
  9POSTHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin
 10POSTHOOK: type: LOAD
 11POSTHOOK: Output: default@srcbucket_mapjoin
 12PREHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin
 13PREHOOK: type: LOAD
 14PREHOOK: Output: default@srcbucket_mapjoin
 15POSTHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin
 16POSTHOOK: type: LOAD
 17POSTHOOK: Output: default@srcbucket_mapjoin
 18PREHOOK: query: CREATE TABLE srcbucket_mapjoin_part (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 4 BUCKETS STORED AS TEXTFILE
 19PREHOOK: type: CREATETABLE
 20POSTHOOK: query: CREATE TABLE srcbucket_mapjoin_part (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 4 BUCKETS STORED AS TEXTFILE
 21POSTHOOK: type: CREATETABLE
 22POSTHOOK: Output: default@srcbucket_mapjoin_part
 23PREHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 24PREHOOK: type: LOAD
 25PREHOOK: Output: default@srcbucket_mapjoin_part
 26POSTHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 27POSTHOOK: type: LOAD
 28POSTHOOK: Output: default@srcbucket_mapjoin_part
 29POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
 30PREHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 31PREHOOK: type: LOAD
 32PREHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
 33POSTHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 34POSTHOOK: type: LOAD
 35POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
 36PREHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 37PREHOOK: type: LOAD
 38PREHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
 39POSTHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 40POSTHOOK: type: LOAD
 41POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
 42PREHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 43PREHOOK: type: LOAD
 44PREHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
 45POSTHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
 46POSTHOOK: type: LOAD
 47POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
 48PREHOOK: query: CREATE TABLE srcbucket_mapjoin_part_2 (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
 49PREHOOK: type: CREATETABLE
 50POSTHOOK: query: CREATE TABLE srcbucket_mapjoin_part_2 (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
 51POSTHOOK: type: CREATETABLE
 52POSTHOOK: Output: default@srcbucket_mapjoin_part_2
 53PREHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
 54PREHOOK: type: LOAD
 55PREHOOK: Output: default@srcbucket_mapjoin_part_2
 56POSTHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
 57POSTHOOK: type: LOAD
 58POSTHOOK: Output: default@srcbucket_mapjoin_part_2
 59POSTHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
 60PREHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
 61PREHOOK: type: LOAD
 62PREHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
 63POSTHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
 64POSTHOOK: type: LOAD
 65POSTHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
 66PREHOOK: query: create table bucketmapjoin_hash_result_1 (key bigint , value1 bigint, value2 bigint)
 67PREHOOK: type: CREATETABLE
 68POSTHOOK: query: create table bucketmapjoin_hash_result_1 (key bigint , value1 bigint, value2 bigint)
 69POSTHOOK: type: CREATETABLE
 70POSTHOOK: Output: default@bucketmapjoin_hash_result_1
 71PREHOOK: query: create table bucketmapjoin_hash_result_2 (key bigint , value1 bigint, value2 bigint)
 72PREHOOK: type: CREATETABLE
 73POSTHOOK: query: create table bucketmapjoin_hash_result_2 (key bigint , value1 bigint, value2 bigint)
 74POSTHOOK: type: CREATETABLE
 75POSTHOOK: Output: default@bucketmapjoin_hash_result_2
 76PREHOOK: query: create table bucketmapjoin_tmp_result (key string , value1 string, value2 string)
 77PREHOOK: type: CREATETABLE
 78POSTHOOK: query: create table bucketmapjoin_tmp_result (key string , value1 string, value2 string)
 79POSTHOOK: type: CREATETABLE
 80POSTHOOK: Output: default@bucketmapjoin_tmp_result
 81PREHOOK: query: explain extended
 82insert overwrite table bucketmapjoin_tmp_result 
 83select /*+mapjoin(b)*/ a.key, a.value, b.value 
 84from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b 
 85on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
 86PREHOOK: type: QUERY
 87POSTHOOK: query: explain extended
 88insert overwrite table bucketmapjoin_tmp_result 
 89select /*+mapjoin(b)*/ a.key, a.value, b.value 
 90from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b 
 91on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
 92POSTHOOK: type: QUERY
 93ABSTRACT SYNTAX TREE:
 94  (TOK_QUERY (TOK_FROM (TOK_JOIN (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin_part_2) a) (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin_part) b) (and (and (= (. (TOK_TABLE_OR_COL a) key) (. (TOK_TABLE_OR_COL b) key)) (= (. (TOK_TABLE_OR_COL b) ds) "2008-04-08")) (= (. (TOK_TABLE_OR_COL a) ds) "2008-04-08")))) (TOK_INSERT (TOK_DESTINATION (TOK_TAB (TOK_TABNAME bucketmapjoin_tmp_result))) (TOK_SELECT (TOK_HINTLIST (TOK_HINT TOK_MAPJOIN (TOK_HINTARGLIST b))) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) key)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) value)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL b) value)))))
 95
 96STAGE DEPENDENCIES:
 97  Stage-7 is a root stage
 98  Stage-1 depends on stages: Stage-7
 99  Stage-5 depends on stages: Stage-1 , consists of Stage-4, Stage-3
100  Stage-4
101  Stage-0 depends on stages: Stage-4, Stage-3
102  Stage-2 depends on stages: Stage-0
103  Stage-3
104
105STAGE PLANS:
106  Stage: Stage-7
107    Map Reduce Local Work
108      Alias -> Map Local Tables:
109        b 
110          Fetch Operator
111            limit: -1
112      Alias -> Map Local Operator Tree:
113        b 
114          TableScan
115            alias: b
116            GatherStats: false
117            HashTable Sink Operator
118              condition expressions:
119                0 {key} {value}
120                1 {value}
121              handleSkewJoin: false
122              keys:
123                0 [Column[key]]
124                1 [Column[key]]
125              Position of Big Table: 0
126      Bucket Mapjoin Context:
127          Alias Bucket Base File Name Mapping:
128            b {srcbucket22.txt=[srcbucket20.txt, srcbucket22.txt], srcbucket23.txt=[srcbucket21.txt, srcbucket23.txt]}
129          Alias Bucket File Name Mapping:
130            b {pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket22.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket20.txt, pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket22.txt], pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket23.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket21.txt, pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket23.txt]}
131          Alias Bucket Output File Name Mapping:
132            pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket22.txt 0
133            pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket23.txt 1
134
135  Stage: Stage-1
136    Map Reduce
137      Alias -> Map Operator Tree:
138        a 
139          TableScan
140            alias: a
141            GatherStats: false
142            Map Join Operator
143              condition map:
144                   Inner Join 0 to 1
145              condition expressions:
146                0 {key} {value}
147                1 {value}
148              handleSkewJoin: false
149              keys:
150                0 [Column[key]]
151                1 [Column[key]]
152              outputColumnNames: _col0, _col1, _col6
153              Position of Big Table: 0
154              Select Operator
155                expressions:
156                      expr: _col0
157                      type: int
158                      expr: _col1
159                      type: string
160                      expr: _col6
161                      type: string
162                outputColumnNames: _col0, _col1, _col6
163                Select Operator
164                  expressions:
165                        expr: _col0
166                        type: int
167                        expr: _col1
168                        type: string
169                        expr: _col6
170                        type: string
171                  outputColumnNames: _col0, _col1, _col2
172                  File Output Operator
173                    compressed: false
174                    GlobalTableId: 1
175                    directory: pfile:/home/amarsri/workspace/hive/build/ql/scratchdir/hive_2011-07-11_01-34-40_179_2078859592920140854/-ext-10002
176                    NumFilesPerFileSink: 1
177                    Stats Publishing Key Prefix: pfile:/home/amarsri/workspace/hive/build/ql/scratchdir/hive_2011-07-11_01-34-40_179_2078859592920140854/-ext-10000/
178                    table:
179                        input format: org.apache.hadoop.mapred.TextInputFormat
180                        output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
181                        properties:
182                          bucket_count -1
183                          columns key,value1,value2
184                          columns.types string:string:string
185                          file.inputformat org.apache.hadoop.mapred.TextInputFormat
186                          file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
187                          location pfile:/home/amarsri/workspace/hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
188                          name default.bucketmapjoin_tmp_result
189                          serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
190                          serialization.format 1
191                          serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
192                          transient_lastDdlTime 1310373280
193                        serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
194                        name: default.bucketmapjoin_tmp_result
195                    TotalFiles: 1
196                    GatherStats: true
197                    MultiFileSpray: false
198      Local Work:
199        Map Reduce Local Work
200      Needs Tagging: false
201      Path -> Alias:
202        pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08 [a]
203      Path -> Partition:
204        pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08 
205          Partition
206            base file name: ds=2008-04-08
207            input format: org.apache.hadoop.mapred.TextInputFormat
208            output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
209            partition values:
210              ds 2008-04-08
211            properties:
212              bucket_count 2
213              bucket_field_name key
214              columns key,value
215              columns.types int:string
216              file.inputformat org.apache.hadoop.mapred.TextInputFormat
217              file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
218              location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08
219              name default.srcbucket_mapjoin_part_2
220              partition_columns ds
221              serialization.ddl struct srcbucket_mapjoin_part_2 { i32 key, string value}
222              serialization.format 1
223              serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
224              transient_lastDdlTime 1306979174
225            serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
226          
227              input format: org.apache.hadoop.mapred.TextInputFormat
228              output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
229              properties:
230                bucket_count 2
231                bucket_field_name key
232                columns key,value
233                columns.types int:string
234                file.inputformat org.apache.hadoop.mapred.TextInputFormat
235                file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
236                location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2
237                name default.srcbucket_mapjoin_part_2
238                partition_columns ds
239                serialization.ddl struct srcbucket_mapjoin_part_2 { i32 key, string value}
240                serialization.format 1
241                serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
242                transient_lastDdlTime 1306979173
243              serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
244              name: default.srcbucket_mapjoin_part_2
245            name: default.srcbucket_mapjoin_part_2
246
247  Stage: Stage-5
248    Conditional Operator
249
250  Stage: Stage-4
251    Move Operator
252      files:
253          hdfs directory: true
254          source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10002
255          destination: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10000
256
257  Stage: Stage-0
258    Move Operator
259      tables:
260          replace: true
261          source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10000
262          table:
263              input format: org.apache.hadoop.mapred.TextInputFormat
264              output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
265              properties:
266                bucket_count -1
267                columns key,value1,value2
268                columns.types string:string:string
269                file.inputformat org.apache.hadoop.mapred.TextInputFormat
270                file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
271                location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
272                name default.bucketmapjoin_tmp_result
273                serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
274                serialization.format 1
275                serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
276                transient_lastDdlTime 1306979174
277              serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
278              name: default.bucketmapjoin_tmp_result
279          tmp directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10001
280
281  Stage: Stage-2
282    Stats-Aggr Operator
283      Stats Aggregation Key Prefix: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10000/
284
285  Stage: Stage-3
286    Map Reduce
287      Alias -> Map Operator Tree:
288        pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10002 
289            File Output Operator
290              compressed: false
291              GlobalTableId: 0
292              directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10000
293              NumFilesPerFileSink: 1
294              table:
295                  input format: org.apache.hadoop.mapred.TextInputFormat
296                  output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
297                  properties:
298                    bucket_count -1
299                    columns key,value1,value2
300                    columns.types string:string:string
301                    file.inputformat org.apache.hadoop.mapred.TextInputFormat
302                    file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
303                    location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
304                    name default.bucketmapjoin_tmp_result
305                    serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
306                    serialization.format 1
307                    serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
308                    transient_lastDdlTime 1306979174
309                  serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
310                  name: default.bucketmapjoin_tmp_result
311              TotalFiles: 1
312              GatherStats: false
313              MultiFileSpray: false
314      Needs Tagging: false
315      Path -> Alias:
316        pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10002 [pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10002]
317      Path -> Partition:
318        pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10002 
319          Partition
320            base file name: -ext-10002
321            input format: org.apache.hadoop.mapred.TextInputFormat
322            output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
323            properties:
324              bucket_count -1
325              columns key,value1,value2
326              columns.types string:string:string
327              file.inputformat org.apache.hadoop.mapred.TextInputFormat
328              file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
329              location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
330              name default.bucketmapjoin_tmp_result
331              serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
332              serialization.format 1
333              serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
334              transient_lastDdlTime 1306979174
335            serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
336          
337              input format: org.apache.hadoop.mapred.TextInputFormat
338              output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
339              properties:
340                bucket_count -1
341                columns key,value1,value2
342                columns.types string:string:string
343                file.inputformat org.apache.hadoop.mapred.TextInputFormat
344                file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
345                location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
346                name default.bucketmapjoin_tmp_result
347                serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
348                serialization.format 1
349                serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
350                transient_lastDdlTime 1306979174
351              serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
352              name: default.bucketmapjoin_tmp_result
353            name: default.bucketmapjoin_tmp_result
354
355
356PREHOOK: query: insert overwrite table bucketmapjoin_tmp_result 
357select /*+mapjoin(b)*/ a.key, a.value, b.value 
358from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b 
359on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
360PREHOOK: type: QUERY
361PREHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
362PREHOOK: Input: default@srcbucket_mapjoin_part_2@ds=2008-04-08
363PREHOOK: Output: default@bucketmapjoin_tmp_result
364POSTHOOK: query: insert overwrite table bucketmapjoin_tmp_result 
365select /*+mapjoin(b)*/ a.key, a.value, b.value 
366from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b 
367on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
368POSTHOOK: type: QUERY
369POSTHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
370POSTHOOK: Input: default@srcbucket_mapjoin_part_2@ds=2008-04-08
371POSTHOOK: Output: default@bucketmapjoin_tmp_result
372POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
373POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
374POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
375PREHOOK: query: select count(1) from bucketmapjoin_tmp_result
376PREHOOK: type: QUERY
377PREHOOK: Input: default@bucketmapjoin_tmp_result
378PREHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-46-21_973_1112542633479425376/-mr-10000
379POSTHOOK: query: select count(1) from bucketmapjoin_tmp_result
380POSTHOOK: type: QUERY
381POSTHOOK: Input: default@bucketmapjoin_tmp_result
382POSTHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-46-21_973_1112542633479425376/-mr-10000
383POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
384POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
385POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
386564
387PREHOOK: query: insert overwrite table bucketmapjoin_hash_result_1
388select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
389PREHOOK: type: QUERY
390PREHOOK: Input: default@bucketmapjoin_tmp_result
391PREHOOK: Output: default@bucketmapjoin_hash_result_1
392POSTHOOK: query: insert overwrite table bucketmapjoin_hash_result_1
393select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
394POSTHOOK: type: QUERY
395POSTHOOK: Input: default@bucketmapjoin_tmp_result
396POSTHOOK: Output: default@bucketmapjoin_hash_result_1
397POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
398POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
399POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
400POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
401POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
402POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
403PREHOOK: query: insert overwrite table bucketmapjoin_tmp_result 
404select /*+mapjoin(b)*/ a.key, a.value, b.value 
405from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b 
406on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
407PREHOOK: type: QUERY
408PREHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
409PREHOOK: Input: default@srcbucket_mapjoin_part_2@ds=2008-04-08
410PREHOOK: Output: default@bucketmapjoin_tmp_result
411POSTHOOK: query: insert overwrite table bucketmapjoin_tmp_result 
412select /*+mapjoin(b)*/ a.key, a.value, b.value 
413from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b 
414on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
415POSTHOOK: type: QUERY
416POSTHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
417POSTHOOK: Input: default@srcbucket_mapjoin_part_2@ds=2008-04-08
418POSTHOOK: Output: default@bucketmapjoin_tmp_result
419POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
420POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
421POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
422POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
423POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
424POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
425POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
426POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
427POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
428PREHOOK: query: select count(1) from bucketmapjoin_tmp_result
429PREHOOK: type: QUERY
430PREHOOK: Input: default@bucketmapjoin_tmp_result
431PREHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-46-35_394_5427265786129780250/-mr-10000
432POSTHOOK: query: select count(1) from bucketmapjoin_tmp_result
433POSTHOOK: type: QUERY
434POSTHOOK: Input: default@bucketmapjoin_tmp_result
435POSTHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-46-35_394_5427265786129780250/-mr-10000
436POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
437POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
438POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
439POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
440POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
441POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
442POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
443POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
444POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
445564
446PREHOOK: query: insert overwrite table bucketmapjoin_hash_result_2
447select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
448PREHOOK: type: QUERY
449PREHOOK: Input: default@bucketmapjoin_tmp_result
450PREHOOK: Output: default@bucketmapjoin_hash_result_2
451POSTHOOK: query: insert overwrite table bucketmapjoin_hash_result_2
452select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
453POSTHOOK: type: QUERY
454POSTHOOK: Input: default@bucketmapjoin_tmp_result
455POSTHOOK: Output: default@bucketmapjoin_hash_result_2
456POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
457POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
458POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
459POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
460POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
461POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
462POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
463POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
464POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
465POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
466POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
467POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
468PREHOOK: query: select a.key-b.key, a.value1-b.value1, a.value2-b.value2
469from bucketmapjoin_hash_result_1 a left outer join bucketmapjoin_hash_result_2 b
470on a.key = b.key
471PREHOOK: type: QUERY
472PREHOOK: Input: default@bucketmapjoin_hash_result_1
473PREHOOK: Input: default@bucketmapjoin_hash_result_2
474PREHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-46-42_543_1855526648690468691/-mr-10000
475POSTHOOK: query: select a.key-b.key, a.value1-b.value1, a.value2-b.value2
476from bucketmapjoin_hash_result_1 a left outer join bucketmapjoin_hash_result_2 b
477on a.key = b.key
478POSTHOOK: type: QUERY
479POSTHOOK: Input: default@bucketmapjoin_hash_result_1
480POSTHOOK: Input: default@bucketmapjoin_hash_result_2
481POSTHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-46-42_543_1855526648690468691/-mr-10000
482POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
483POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
484POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
485POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
486POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
487POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
488POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
489POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
490POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
491POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
492POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
493POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
4940	0	0
495PREHOOK: query: explain extended 
496insert overwrite table bucketmapjoin_tmp_result 
497select /*+mapjoin(a)*/ a.key, a.value, b.value 
498from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b 
499on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
500PREHOOK: type: QUERY
501POSTHOOK: query: explain extended 
502insert overwrite table bucketmapjoin_tmp_result 
503select /*+mapjoin(a)*/ a.key, a.value, b.value 
504from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b 
505on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
506POSTHOOK: type: QUERY
507POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
508POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
509POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
510POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
511POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
512POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
513POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
514POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
515POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
516POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
517POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
518POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
519ABSTRACT SYNTAX TREE:
520  (TOK_QUERY (TOK_FROM (TOK_JOIN (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin_part_2) a) (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin_part) b) (and (and (= (. (TOK_TABLE_OR_COL a) key) (. (TOK_TABLE_OR_COL b) key)) (= (. (TOK_TABLE_OR_COL b) ds) "2008-04-08")) (= (. (TOK_TABLE_OR_COL a) ds) "2008-04-08")))) (TOK_INSERT (TOK_DESTINATION (TOK_TAB (TOK_TABNAME bucketmapjoin_tmp_result))) (TOK_SELECT (TOK_HINTLIST (TOK_HINT TOK_MAPJOIN (TOK_HINTARGLIST a))) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) key)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) value)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL b) value)))))
521
522STAGE DEPENDENCIES:
523  Stage-7 is a root stage
524  Stage-1 depends on stages: Stage-7
525  Stage-5 depends on stages: Stage-1 , consists of Stage-4, Stage-3
526  Stage-4
527  Stage-0 depends on stages: Stage-4, Stage-3
528  Stage-2 depends on stages: Stage-0
529  Stage-3
530
531STAGE PLANS:
532  Stage: Stage-7
533    Map Reduce Local Work
534      Alias -> Map Local Tables:
535        a 
536          Fetch Operator
537            limit: -1
538      Alias -> Map Local Operator Tree:
539        a 
540          TableScan
541            alias: a
542            GatherStats: false
543            HashTable Sink Operator
544              condition expressions:
545                0 {key} {value}
546                1 {value}
547              handleSkewJoin: false
548              keys:
549                0 [Column[key]]
550                1 [Column[key]]
551              Position of Big Table: 1
552      Bucket Mapjoin Context:
553          Alias Bucket Base File Name Mapping:
554            a {srcbucket20.txt=[srcbucket22.txt], srcbucket21.txt=[srcbucket23.txt], srcbucket22.txt=[srcbucket22.txt], srcbucket23.txt=[srcbucket23.txt]}
555          Alias Bucket File Name Mapping:
556            a {pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket20.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket22.txt], pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket21.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket23.txt], pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket22.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket22.txt], pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket23.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket23.txt]}
557          Alias Bucket Output File Name Mapping:
558            pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket20.txt 0
559            pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket21.txt 1
560            pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket22.txt 2
561            pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket23.txt 3
562
563  Stage: Stage-1
564    Map Reduce
565      Alias -> Map Operator Tree:
566        b 
567          TableScan
568            alias: b
569            GatherStats: false
570            Map Join Operator
571              condition map:
572                   Inner Join 0 to 1
573              condition expressions:
574                0 {key} {value}
575                1 {value}
576              handleSkewJoin: false
577              keys:
578                0 [Column[key]]
579                1 [Column[key]]
580              outputColumnNames: _col0, _col1, _col6
581              Position of Big Table: 1
582              Select Operator
583                expressions:
584                      expr: _col0
585                      type: int
586                      expr: _col1
587                      type: string
588                      expr: _col6
589                      type: string
590                outputColumnNames: _col0, _col1, _col6
591                Select Operator
592                  expressions:
593                        expr: _col0
594                        type: int
595                        expr: _col1
596                        type: string
597                        expr: _col6
598                        type: string
599                  outputColumnNames: _col0, _col1, _col2
600                  File Output Operator
601                    compressed: false
602                    GlobalTableId: 1
603                    directory: pfile:/home/amarsri/workspace/hive/build/ql/scratchdir/hive_2011-07-11_01-35-06_760_1506759328569853293/-ext-10002
604                    NumFilesPerFileSink: 1
605                    Stats Publishing Key Prefix: pfile:/home/amarsri/workspace/hive/build/ql/scratchdir/hive_2011-07-11_01-35-06_760_1506759328569853293/-ext-10000/
606                    table:
607                        input format: org.apache.hadoop.mapred.TextInputFormat
608                        output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
609                        properties:
610                          bucket_count -1
611                          columns key,value1,value2
612                          columns.types string:string:string
613                          file.inputformat org.apache.hadoop.mapred.TextInputFormat
614                          file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
615                          location pfile:/home/amarsri/workspace/hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
616                          name default.bucketmapjoin_tmp_result
617                          numFiles 1
618                          numPartitions 0
619                          numRows 564
620                          rawDataSize 10503
621                          serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
622                          serialization.format 1
623                          serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
624                          totalSize 11067
625                          transient_lastDdlTime 1310373297
626                        serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
627                        name: default.bucketmapjoin_tmp_result
628                    TotalFiles: 1
629                    GatherStats: true
630                    MultiFileSpray: false
631      Local Work:
632        Map Reduce Local Work
633      Needs Tagging: false
634      Path -> Alias:
635        pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08 [b]
636      Path -> Partition:
637        pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08 
638          Partition
639            base file name: ds=2008-04-08
640            input format: org.apache.hadoop.mapred.TextInputFormat
641            output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
642            partition values:
643              ds 2008-04-08
644            properties:
645              bucket_count 4
646              bucket_field_name key
647              columns key,value
648              columns.types int:string
649              file.inputformat org.apache.hadoop.mapred.TextInputFormat
650              file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
651              location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08
652              name default.srcbucket_mapjoin_part
653              partition_columns ds
654              serialization.ddl struct srcbucket_mapjoin_part { i32 key, string value}
655              serialization.format 1
656              serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
657              transient_lastDdlTime 1306979173
658            serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
659          
660              input format: org.apache.hadoop.mapred.TextInputFormat
661              output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
662              properties:
663                bucket_count 4
664                bucket_field_name key
665                columns key,value
666                columns.types int:string
667                file.inputformat org.apache.hadoop.mapred.TextInputFormat
668                file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
669                location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part
670                name default.srcbucket_mapjoin_part
671                partition_columns ds
672                serialization.ddl struct srcbucket_mapjoin_part { i32 key, string value}
673                serialization.format 1
674                serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
675                transient_lastDdlTime 1306979170
676              serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
677              name: default.srcbucket_mapjoin_part
678            name: default.srcbucket_mapjoin_part
679
680  Stage: Stage-5
681    Conditional Operator
682
683  Stage: Stage-4
684    Move Operator
685      files:
686          hdfs directory: true
687          source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10002
688          destination: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10000
689
690  Stage: Stage-0
691    Move Operator
692      tables:
693          replace: true
694          source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10000
695          table:
696              input format: org.apache.hadoop.mapred.TextInputFormat
697              output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
698              properties:
699                bucket_count -1
700                columns key,value1,value2
701                columns.types string:string:string
702                file.inputformat org.apache.hadoop.mapred.TextInputFormat
703                file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
704                location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
705                name default.bucketmapjoin_tmp_result
706                numFiles 1
707                numPartitions 0
708                numRows 564
709                rawDataSize 10503
710                serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
711                serialization.format 1
712                serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
713                totalSize 11067
714                transient_lastDdlTime 1306979195
715              serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
716              name: default.bucketmapjoin_tmp_result
717          tmp directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10001
718
719  Stage: Stage-2
720    Stats-Aggr Operator
721      Stats Aggregation Key Prefix: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10000/
722
723  Stage: Stage-3
724    Map Reduce
725      Alias -> Map Operator Tree:
726        pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10002 
727            File Output Operator
728              compressed: false
729              GlobalTableId: 0
730              directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10000
731              NumFilesPerFileSink: 1
732              table:
733                  input format: org.apache.hadoop.mapred.TextInputFormat
734                  output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
735                  properties:
736                    bucket_count -1
737                    columns key,value1,value2
738                    columns.types string:string:string
739                    file.inputformat org.apache.hadoop.mapred.TextInputFormat
740                    file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
741                    location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
742                    name default.bucketmapjoin_tmp_result
743                    numFiles 1
744                    numPartitions 0
745                    numRows 564
746                    rawDataSize 10503
747                    serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
748                    serialization.format 1
749                    serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
750                    totalSize 11067
751                    transient_lastDdlTime 1306979195
752                  serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
753                  name: default.bucketmapjoin_tmp_result
754              TotalFiles: 1
755              GatherStats: false
756              MultiFileSpray: false
757      Needs Tagging: false
758      Path -> Alias:
759        pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10002 [pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10002]
760      Path -> Partition:
761        pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10002 
762          Partition
763            base file name: -ext-10002
764            input format: org.apache.hadoop.mapred.TextInputFormat
765            output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
766            properties:
767              bucket_count -1
768              columns key,value1,value2
769              columns.types string:string:string
770              file.inputformat org.apache.hadoop.mapred.TextInputFormat
771              file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
772              location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_r…

Large files files are truncated, but you can click here to view the full file