PageRenderTime 57ms CodeModel.GetById 18ms RepoModel.GetById 1ms app.codeStats 0ms

/tags/release-0.2.0-rc0/hive/external/ql/src/test/results/clientpositive/bucketmapjoin3.q.out

#
text | 1031 lines | 1007 code | 24 blank | 0 comment | 0 complexity | f51fdcb56bf6cbad98bc2dd47d4c0869 MD5 | raw file
Possible License(s): Apache-2.0, BSD-3-Clause, JSON, CPL-1.0

Large files are truncated, but you can click here to view the full file

  1. PREHOOK: query: CREATE TABLE srcbucket_mapjoin(key int, value string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  2. PREHOOK: type: CREATETABLE
  3. POSTHOOK: query: CREATE TABLE srcbucket_mapjoin(key int, value string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  4. POSTHOOK: type: CREATETABLE
  5. POSTHOOK: Output: default@srcbucket_mapjoin
  6. PREHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin
  7. PREHOOK: type: LOAD
  8. PREHOOK: Output: default@srcbucket_mapjoin
  9. POSTHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin
  10. POSTHOOK: type: LOAD
  11. POSTHOOK: Output: default@srcbucket_mapjoin
  12. PREHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin
  13. PREHOOK: type: LOAD
  14. PREHOOK: Output: default@srcbucket_mapjoin
  15. POSTHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin
  16. POSTHOOK: type: LOAD
  17. POSTHOOK: Output: default@srcbucket_mapjoin
  18. PREHOOK: query: CREATE TABLE srcbucket_mapjoin_part (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 4 BUCKETS STORED AS TEXTFILE
  19. PREHOOK: type: CREATETABLE
  20. POSTHOOK: query: CREATE TABLE srcbucket_mapjoin_part (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 4 BUCKETS STORED AS TEXTFILE
  21. POSTHOOK: type: CREATETABLE
  22. POSTHOOK: Output: default@srcbucket_mapjoin_part
  23. PREHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  24. PREHOOK: type: LOAD
  25. PREHOOK: Output: default@srcbucket_mapjoin_part
  26. POSTHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  27. POSTHOOK: type: LOAD
  28. POSTHOOK: Output: default@srcbucket_mapjoin_part
  29. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  30. PREHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  31. PREHOOK: type: LOAD
  32. PREHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  33. POSTHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  34. POSTHOOK: type: LOAD
  35. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  36. PREHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  37. PREHOOK: type: LOAD
  38. PREHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  39. POSTHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  40. POSTHOOK: type: LOAD
  41. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  42. PREHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  43. PREHOOK: type: LOAD
  44. PREHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  45. POSTHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  46. POSTHOOK: type: LOAD
  47. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  48. PREHOOK: query: CREATE TABLE srcbucket_mapjoin_part_2 (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  49. PREHOOK: type: CREATETABLE
  50. POSTHOOK: query: CREATE TABLE srcbucket_mapjoin_part_2 (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  51. POSTHOOK: type: CREATETABLE
  52. POSTHOOK: Output: default@srcbucket_mapjoin_part_2
  53. PREHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  54. PREHOOK: type: LOAD
  55. PREHOOK: Output: default@srcbucket_mapjoin_part_2
  56. POSTHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  57. POSTHOOK: type: LOAD
  58. POSTHOOK: Output: default@srcbucket_mapjoin_part_2
  59. POSTHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  60. PREHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  61. PREHOOK: type: LOAD
  62. PREHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  63. POSTHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  64. POSTHOOK: type: LOAD
  65. POSTHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  66. PREHOOK: query: create table bucketmapjoin_hash_result_1 (key bigint , value1 bigint, value2 bigint)
  67. PREHOOK: type: CREATETABLE
  68. POSTHOOK: query: create table bucketmapjoin_hash_result_1 (key bigint , value1 bigint, value2 bigint)
  69. POSTHOOK: type: CREATETABLE
  70. POSTHOOK: Output: default@bucketmapjoin_hash_result_1
  71. PREHOOK: query: create table bucketmapjoin_hash_result_2 (key bigint , value1 bigint, value2 bigint)
  72. PREHOOK: type: CREATETABLE
  73. POSTHOOK: query: create table bucketmapjoin_hash_result_2 (key bigint , value1 bigint, value2 bigint)
  74. POSTHOOK: type: CREATETABLE
  75. POSTHOOK: Output: default@bucketmapjoin_hash_result_2
  76. PREHOOK: query: create table bucketmapjoin_tmp_result (key string , value1 string, value2 string)
  77. PREHOOK: type: CREATETABLE
  78. POSTHOOK: query: create table bucketmapjoin_tmp_result (key string , value1 string, value2 string)
  79. POSTHOOK: type: CREATETABLE
  80. POSTHOOK: Output: default@bucketmapjoin_tmp_result
  81. PREHOOK: query: explain extended
  82. insert overwrite table bucketmapjoin_tmp_result
  83. select /*+mapjoin(b)*/ a.key, a.value, b.value
  84. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  85. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  86. PREHOOK: type: QUERY
  87. POSTHOOK: query: explain extended
  88. insert overwrite table bucketmapjoin_tmp_result
  89. select /*+mapjoin(b)*/ a.key, a.value, b.value
  90. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  91. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  92. POSTHOOK: type: QUERY
  93. ABSTRACT SYNTAX TREE:
  94. (TOK_QUERY (TOK_FROM (TOK_JOIN (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin_part_2) a) (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin_part) b) (and (and (= (. (TOK_TABLE_OR_COL a) key) (. (TOK_TABLE_OR_COL b) key)) (= (. (TOK_TABLE_OR_COL b) ds) "2008-04-08")) (= (. (TOK_TABLE_OR_COL a) ds) "2008-04-08")))) (TOK_INSERT (TOK_DESTINATION (TOK_TAB (TOK_TABNAME bucketmapjoin_tmp_result))) (TOK_SELECT (TOK_HINTLIST (TOK_HINT TOK_MAPJOIN (TOK_HINTARGLIST b))) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) key)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) value)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL b) value)))))
  95. STAGE DEPENDENCIES:
  96. Stage-7 is a root stage
  97. Stage-1 depends on stages: Stage-7
  98. Stage-5 depends on stages: Stage-1 , consists of Stage-4, Stage-3
  99. Stage-4
  100. Stage-0 depends on stages: Stage-4, Stage-3
  101. Stage-2 depends on stages: Stage-0
  102. Stage-3
  103. STAGE PLANS:
  104. Stage: Stage-7
  105. Map Reduce Local Work
  106. Alias -> Map Local Tables:
  107. b
  108. Fetch Operator
  109. limit: -1
  110. Alias -> Map Local Operator Tree:
  111. b
  112. TableScan
  113. alias: b
  114. GatherStats: false
  115. HashTable Sink Operator
  116. condition expressions:
  117. 0 {key} {value}
  118. 1 {value}
  119. handleSkewJoin: false
  120. keys:
  121. 0 [Column[key]]
  122. 1 [Column[key]]
  123. Position of Big Table: 0
  124. Bucket Mapjoin Context:
  125. Alias Bucket Base File Name Mapping:
  126. b {srcbucket22.txt=[srcbucket20.txt, srcbucket22.txt], srcbucket23.txt=[srcbucket21.txt, srcbucket23.txt]}
  127. Alias Bucket File Name Mapping:
  128. b {pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket22.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket20.txt, pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket22.txt], pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket23.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket21.txt, pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket23.txt]}
  129. Alias Bucket Output File Name Mapping:
  130. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket22.txt 0
  131. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket23.txt 1
  132. Stage: Stage-1
  133. Map Reduce
  134. Alias -> Map Operator Tree:
  135. a
  136. TableScan
  137. alias: a
  138. GatherStats: false
  139. Map Join Operator
  140. condition map:
  141. Inner Join 0 to 1
  142. condition expressions:
  143. 0 {key} {value}
  144. 1 {value}
  145. handleSkewJoin: false
  146. keys:
  147. 0 [Column[key]]
  148. 1 [Column[key]]
  149. outputColumnNames: _col0, _col1, _col6
  150. Position of Big Table: 0
  151. Select Operator
  152. expressions:
  153. expr: _col0
  154. type: int
  155. expr: _col1
  156. type: string
  157. expr: _col6
  158. type: string
  159. outputColumnNames: _col0, _col1, _col6
  160. Select Operator
  161. expressions:
  162. expr: _col0
  163. type: int
  164. expr: _col1
  165. type: string
  166. expr: _col6
  167. type: string
  168. outputColumnNames: _col0, _col1, _col2
  169. File Output Operator
  170. compressed: false
  171. GlobalTableId: 1
  172. directory: pfile:/home/amarsri/workspace/hive/build/ql/scratchdir/hive_2011-07-11_01-34-40_179_2078859592920140854/-ext-10002
  173. NumFilesPerFileSink: 1
  174. Stats Publishing Key Prefix: pfile:/home/amarsri/workspace/hive/build/ql/scratchdir/hive_2011-07-11_01-34-40_179_2078859592920140854/-ext-10000/
  175. table:
  176. input format: org.apache.hadoop.mapred.TextInputFormat
  177. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  178. properties:
  179. bucket_count -1
  180. columns key,value1,value2
  181. columns.types string:string:string
  182. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  183. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  184. location pfile:/home/amarsri/workspace/hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  185. name default.bucketmapjoin_tmp_result
  186. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  187. serialization.format 1
  188. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  189. transient_lastDdlTime 1310373280
  190. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  191. name: default.bucketmapjoin_tmp_result
  192. TotalFiles: 1
  193. GatherStats: true
  194. MultiFileSpray: false
  195. Local Work:
  196. Map Reduce Local Work
  197. Needs Tagging: false
  198. Path -> Alias:
  199. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08 [a]
  200. Path -> Partition:
  201. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08
  202. Partition
  203. base file name: ds=2008-04-08
  204. input format: org.apache.hadoop.mapred.TextInputFormat
  205. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  206. partition values:
  207. ds 2008-04-08
  208. properties:
  209. bucket_count 2
  210. bucket_field_name key
  211. columns key,value
  212. columns.types int:string
  213. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  214. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  215. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08
  216. name default.srcbucket_mapjoin_part_2
  217. partition_columns ds
  218. serialization.ddl struct srcbucket_mapjoin_part_2 { i32 key, string value}
  219. serialization.format 1
  220. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  221. transient_lastDdlTime 1306979174
  222. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  223. input format: org.apache.hadoop.mapred.TextInputFormat
  224. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  225. properties:
  226. bucket_count 2
  227. bucket_field_name key
  228. columns key,value
  229. columns.types int:string
  230. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  231. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  232. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2
  233. name default.srcbucket_mapjoin_part_2
  234. partition_columns ds
  235. serialization.ddl struct srcbucket_mapjoin_part_2 { i32 key, string value}
  236. serialization.format 1
  237. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  238. transient_lastDdlTime 1306979173
  239. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  240. name: default.srcbucket_mapjoin_part_2
  241. name: default.srcbucket_mapjoin_part_2
  242. Stage: Stage-5
  243. Conditional Operator
  244. Stage: Stage-4
  245. Move Operator
  246. files:
  247. hdfs directory: true
  248. source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10002
  249. destination: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10000
  250. Stage: Stage-0
  251. Move Operator
  252. tables:
  253. replace: true
  254. source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10000
  255. table:
  256. input format: org.apache.hadoop.mapred.TextInputFormat
  257. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  258. properties:
  259. bucket_count -1
  260. columns key,value1,value2
  261. columns.types string:string:string
  262. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  263. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  264. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  265. name default.bucketmapjoin_tmp_result
  266. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  267. serialization.format 1
  268. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  269. transient_lastDdlTime 1306979174
  270. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  271. name: default.bucketmapjoin_tmp_result
  272. tmp directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10001
  273. Stage: Stage-2
  274. Stats-Aggr Operator
  275. Stats Aggregation Key Prefix: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10000/
  276. Stage: Stage-3
  277. Map Reduce
  278. Alias -> Map Operator Tree:
  279. pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10002
  280. File Output Operator
  281. compressed: false
  282. GlobalTableId: 0
  283. directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10000
  284. NumFilesPerFileSink: 1
  285. table:
  286. input format: org.apache.hadoop.mapred.TextInputFormat
  287. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  288. properties:
  289. bucket_count -1
  290. columns key,value1,value2
  291. columns.types string:string:string
  292. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  293. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  294. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  295. name default.bucketmapjoin_tmp_result
  296. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  297. serialization.format 1
  298. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  299. transient_lastDdlTime 1306979174
  300. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  301. name: default.bucketmapjoin_tmp_result
  302. TotalFiles: 1
  303. GatherStats: false
  304. MultiFileSpray: false
  305. Needs Tagging: false
  306. Path -> Alias:
  307. pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10002 [pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10002]
  308. Path -> Partition:
  309. pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-14_989_6212335898656818660/-ext-10002
  310. Partition
  311. base file name: -ext-10002
  312. input format: org.apache.hadoop.mapred.TextInputFormat
  313. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  314. properties:
  315. bucket_count -1
  316. columns key,value1,value2
  317. columns.types string:string:string
  318. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  319. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  320. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  321. name default.bucketmapjoin_tmp_result
  322. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  323. serialization.format 1
  324. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  325. transient_lastDdlTime 1306979174
  326. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  327. input format: org.apache.hadoop.mapred.TextInputFormat
  328. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  329. properties:
  330. bucket_count -1
  331. columns key,value1,value2
  332. columns.types string:string:string
  333. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  334. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  335. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  336. name default.bucketmapjoin_tmp_result
  337. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  338. serialization.format 1
  339. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  340. transient_lastDdlTime 1306979174
  341. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  342. name: default.bucketmapjoin_tmp_result
  343. name: default.bucketmapjoin_tmp_result
  344. PREHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  345. select /*+mapjoin(b)*/ a.key, a.value, b.value
  346. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  347. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  348. PREHOOK: type: QUERY
  349. PREHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
  350. PREHOOK: Input: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  351. PREHOOK: Output: default@bucketmapjoin_tmp_result
  352. POSTHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  353. select /*+mapjoin(b)*/ a.key, a.value, b.value
  354. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  355. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  356. POSTHOOK: type: QUERY
  357. POSTHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
  358. POSTHOOK: Input: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  359. POSTHOOK: Output: default@bucketmapjoin_tmp_result
  360. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  361. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  362. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  363. PREHOOK: query: select count(1) from bucketmapjoin_tmp_result
  364. PREHOOK: type: QUERY
  365. PREHOOK: Input: default@bucketmapjoin_tmp_result
  366. PREHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-46-21_973_1112542633479425376/-mr-10000
  367. POSTHOOK: query: select count(1) from bucketmapjoin_tmp_result
  368. POSTHOOK: type: QUERY
  369. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  370. POSTHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-46-21_973_1112542633479425376/-mr-10000
  371. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  372. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  373. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  374. 564
  375. PREHOOK: query: insert overwrite table bucketmapjoin_hash_result_1
  376. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  377. PREHOOK: type: QUERY
  378. PREHOOK: Input: default@bucketmapjoin_tmp_result
  379. PREHOOK: Output: default@bucketmapjoin_hash_result_1
  380. POSTHOOK: query: insert overwrite table bucketmapjoin_hash_result_1
  381. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  382. POSTHOOK: type: QUERY
  383. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  384. POSTHOOK: Output: default@bucketmapjoin_hash_result_1
  385. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  386. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  387. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  388. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  389. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  390. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  391. PREHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  392. select /*+mapjoin(b)*/ a.key, a.value, b.value
  393. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  394. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  395. PREHOOK: type: QUERY
  396. PREHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
  397. PREHOOK: Input: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  398. PREHOOK: Output: default@bucketmapjoin_tmp_result
  399. POSTHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  400. select /*+mapjoin(b)*/ a.key, a.value, b.value
  401. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  402. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  403. POSTHOOK: type: QUERY
  404. POSTHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
  405. POSTHOOK: Input: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  406. POSTHOOK: Output: default@bucketmapjoin_tmp_result
  407. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  408. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  409. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  410. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  411. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  412. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  413. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  414. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  415. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  416. PREHOOK: query: select count(1) from bucketmapjoin_tmp_result
  417. PREHOOK: type: QUERY
  418. PREHOOK: Input: default@bucketmapjoin_tmp_result
  419. PREHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-46-35_394_5427265786129780250/-mr-10000
  420. POSTHOOK: query: select count(1) from bucketmapjoin_tmp_result
  421. POSTHOOK: type: QUERY
  422. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  423. POSTHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-46-35_394_5427265786129780250/-mr-10000
  424. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  425. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  426. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  427. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  428. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  429. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  430. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  431. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  432. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  433. 564
  434. PREHOOK: query: insert overwrite table bucketmapjoin_hash_result_2
  435. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  436. PREHOOK: type: QUERY
  437. PREHOOK: Input: default@bucketmapjoin_tmp_result
  438. PREHOOK: Output: default@bucketmapjoin_hash_result_2
  439. POSTHOOK: query: insert overwrite table bucketmapjoin_hash_result_2
  440. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  441. POSTHOOK: type: QUERY
  442. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  443. POSTHOOK: Output: default@bucketmapjoin_hash_result_2
  444. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  445. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  446. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  447. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  448. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  449. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  450. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  451. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  452. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  453. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  454. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  455. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  456. PREHOOK: query: select a.key-b.key, a.value1-b.value1, a.value2-b.value2
  457. from bucketmapjoin_hash_result_1 a left outer join bucketmapjoin_hash_result_2 b
  458. on a.key = b.key
  459. PREHOOK: type: QUERY
  460. PREHOOK: Input: default@bucketmapjoin_hash_result_1
  461. PREHOOK: Input: default@bucketmapjoin_hash_result_2
  462. PREHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-46-42_543_1855526648690468691/-mr-10000
  463. POSTHOOK: query: select a.key-b.key, a.value1-b.value1, a.value2-b.value2
  464. from bucketmapjoin_hash_result_1 a left outer join bucketmapjoin_hash_result_2 b
  465. on a.key = b.key
  466. POSTHOOK: type: QUERY
  467. POSTHOOK: Input: default@bucketmapjoin_hash_result_1
  468. POSTHOOK: Input: default@bucketmapjoin_hash_result_2
  469. POSTHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-46-42_543_1855526648690468691/-mr-10000
  470. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  471. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  472. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  473. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  474. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  475. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  476. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  477. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  478. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  479. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  480. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  481. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  482. 0 0 0
  483. PREHOOK: query: explain extended
  484. insert overwrite table bucketmapjoin_tmp_result
  485. select /*+mapjoin(a)*/ a.key, a.value, b.value
  486. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  487. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  488. PREHOOK: type: QUERY
  489. POSTHOOK: query: explain extended
  490. insert overwrite table bucketmapjoin_tmp_result
  491. select /*+mapjoin(a)*/ a.key, a.value, b.value
  492. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  493. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  494. POSTHOOK: type: QUERY
  495. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  496. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  497. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  498. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  499. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  500. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  501. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  502. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  503. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  504. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  505. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  506. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  507. ABSTRACT SYNTAX TREE:
  508. (TOK_QUERY (TOK_FROM (TOK_JOIN (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin_part_2) a) (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin_part) b) (and (and (= (. (TOK_TABLE_OR_COL a) key) (. (TOK_TABLE_OR_COL b) key)) (= (. (TOK_TABLE_OR_COL b) ds) "2008-04-08")) (= (. (TOK_TABLE_OR_COL a) ds) "2008-04-08")))) (TOK_INSERT (TOK_DESTINATION (TOK_TAB (TOK_TABNAME bucketmapjoin_tmp_result))) (TOK_SELECT (TOK_HINTLIST (TOK_HINT TOK_MAPJOIN (TOK_HINTARGLIST a))) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) key)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) value)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL b) value)))))
  509. STAGE DEPENDENCIES:
  510. Stage-7 is a root stage
  511. Stage-1 depends on stages: Stage-7
  512. Stage-5 depends on stages: Stage-1 , consists of Stage-4, Stage-3
  513. Stage-4
  514. Stage-0 depends on stages: Stage-4, Stage-3
  515. Stage-2 depends on stages: Stage-0
  516. Stage-3
  517. STAGE PLANS:
  518. Stage: Stage-7
  519. Map Reduce Local Work
  520. Alias -> Map Local Tables:
  521. a
  522. Fetch Operator
  523. limit: -1
  524. Alias -> Map Local Operator Tree:
  525. a
  526. TableScan
  527. alias: a
  528. GatherStats: false
  529. HashTable Sink Operator
  530. condition expressions:
  531. 0 {key} {value}
  532. 1 {value}
  533. handleSkewJoin: false
  534. keys:
  535. 0 [Column[key]]
  536. 1 [Column[key]]
  537. Position of Big Table: 1
  538. Bucket Mapjoin Context:
  539. Alias Bucket Base File Name Mapping:
  540. a {srcbucket20.txt=[srcbucket22.txt], srcbucket21.txt=[srcbucket23.txt], srcbucket22.txt=[srcbucket22.txt], srcbucket23.txt=[srcbucket23.txt]}
  541. Alias Bucket File Name Mapping:
  542. a {pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket20.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket22.txt], pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket21.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket23.txt], pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket22.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket22.txt], pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket23.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket23.txt]}
  543. Alias Bucket Output File Name Mapping:
  544. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket20.txt 0
  545. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket21.txt 1
  546. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket22.txt 2
  547. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket23.txt 3
  548. Stage: Stage-1
  549. Map Reduce
  550. Alias -> Map Operator Tree:
  551. b
  552. TableScan
  553. alias: b
  554. GatherStats: false
  555. Map Join Operator
  556. condition map:
  557. Inner Join 0 to 1
  558. condition expressions:
  559. 0 {key} {value}
  560. 1 {value}
  561. handleSkewJoin: false
  562. keys:
  563. 0 [Column[key]]
  564. 1 [Column[key]]
  565. outputColumnNames: _col0, _col1, _col6
  566. Position of Big Table: 1
  567. Select Operator
  568. expressions:
  569. expr: _col0
  570. type: int
  571. expr: _col1
  572. type: string
  573. expr: _col6
  574. type: string
  575. outputColumnNames: _col0, _col1, _col6
  576. Select Operator
  577. expressions:
  578. expr: _col0
  579. type: int
  580. expr: _col1
  581. type: string
  582. expr: _col6
  583. type: string
  584. outputColumnNames: _col0, _col1, _col2
  585. File Output Operator
  586. compressed: false
  587. GlobalTableId: 1
  588. directory: pfile:/home/amarsri/workspace/hive/build/ql/scratchdir/hive_2011-07-11_01-35-06_760_1506759328569853293/-ext-10002
  589. NumFilesPerFileSink: 1
  590. Stats Publishing Key Prefix: pfile:/home/amarsri/workspace/hive/build/ql/scratchdir/hive_2011-07-11_01-35-06_760_1506759328569853293/-ext-10000/
  591. table:
  592. input format: org.apache.hadoop.mapred.TextInputFormat
  593. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  594. properties:
  595. bucket_count -1
  596. columns key,value1,value2
  597. columns.types string:string:string
  598. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  599. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  600. location pfile:/home/amarsri/workspace/hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  601. name default.bucketmapjoin_tmp_result
  602. numFiles 1
  603. numPartitions 0
  604. numRows 564
  605. rawDataSize 10503
  606. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  607. serialization.format 1
  608. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  609. totalSize 11067
  610. transient_lastDdlTime 1310373297
  611. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  612. name: default.bucketmapjoin_tmp_result
  613. TotalFiles: 1
  614. GatherStats: true
  615. MultiFileSpray: false
  616. Local Work:
  617. Map Reduce Local Work
  618. Needs Tagging: false
  619. Path -> Alias:
  620. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08 [b]
  621. Path -> Partition:
  622. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08
  623. Partition
  624. base file name: ds=2008-04-08
  625. input format: org.apache.hadoop.mapred.TextInputFormat
  626. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  627. partition values:
  628. ds 2008-04-08
  629. properties:
  630. bucket_count 4
  631. bucket_field_name key
  632. columns key,value
  633. columns.types int:string
  634. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  635. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  636. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08
  637. name default.srcbucket_mapjoin_part
  638. partition_columns ds
  639. serialization.ddl struct srcbucket_mapjoin_part { i32 key, string value}
  640. serialization.format 1
  641. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  642. transient_lastDdlTime 1306979173
  643. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  644. input format: org.apache.hadoop.mapred.TextInputFormat
  645. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  646. properties:
  647. bucket_count 4
  648. bucket_field_name key
  649. columns key,value
  650. columns.types int:string
  651. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  652. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  653. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin_part
  654. name default.srcbucket_mapjoin_part
  655. partition_columns ds
  656. serialization.ddl struct srcbucket_mapjoin_part { i32 key, string value}
  657. serialization.format 1
  658. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  659. transient_lastDdlTime 1306979170
  660. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  661. name: default.srcbucket_mapjoin_part
  662. name: default.srcbucket_mapjoin_part
  663. Stage: Stage-5
  664. Conditional Operator
  665. Stage: Stage-4
  666. Move Operator
  667. files:
  668. hdfs directory: true
  669. source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10002
  670. destination: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10000
  671. Stage: Stage-0
  672. Move Operator
  673. tables:
  674. replace: true
  675. source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10000
  676. table:
  677. input format: org.apache.hadoop.mapred.TextInputFormat
  678. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  679. properties:
  680. bucket_count -1
  681. columns key,value1,value2
  682. columns.types string:string:string
  683. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  684. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  685. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  686. name default.bucketmapjoin_tmp_result
  687. numFiles 1
  688. numPartitions 0
  689. numRows 564
  690. rawDataSize 10503
  691. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  692. serialization.format 1
  693. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  694. totalSize 11067
  695. transient_lastDdlTime 1306979195
  696. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  697. name: default.bucketmapjoin_tmp_result
  698. tmp directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10001
  699. Stage: Stage-2
  700. Stats-Aggr Operator
  701. Stats Aggregation Key Prefix: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10000/
  702. Stage: Stage-3
  703. Map Reduce
  704. Alias -> Map Operator Tree:
  705. pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10002
  706. File Output Operator
  707. compressed: false
  708. GlobalTableId: 0
  709. directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10000
  710. NumFilesPerFileSink: 1
  711. table:
  712. input format: org.apache.hadoop.mapred.TextInputFormat
  713. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  714. properties:
  715. bucket_count -1
  716. columns key,value1,value2
  717. columns.types string:string:string
  718. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  719. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  720. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  721. name default.bucketmapjoin_tmp_result
  722. numFiles 1
  723. numPartitions 0
  724. numRows 564
  725. rawDataSize 10503
  726. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  727. serialization.format 1
  728. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  729. totalSize 11067
  730. transient_lastDdlTime 1306979195
  731. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  732. name: default.bucketmapjoin_tmp_result
  733. TotalFiles: 1
  734. GatherStats: false
  735. MultiFileSpray: false
  736. Needs Tagging: false
  737. Path -> Alias:
  738. pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10002 [pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10002]
  739. Path -> Partition:
  740. pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-46-45_810_5134529884228638664/-ext-10002
  741. Partition
  742. base file name: -ext-10002
  743. input format: org.apache.hadoop.mapred.TextInputFormat
  744. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  745. properties:
  746. bucket_count -1
  747. columns key,value1,value2
  748. columns.types string:string:string
  749. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  750. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  751. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_r

Large files files are truncated, but you can click here to view the full file