PageRenderTime 37ms CodeModel.GetById 4ms RepoModel.GetById 0ms app.codeStats 0ms

/tags/release-0.0.0-rc0/hive/external/ql/src/test/results/clientpositive/bucketmapjoin3.q.out

#
text | 1036 lines | 1012 code | 24 blank | 0 comment | 0 complexity | 9f08679dcfd99b8516dbeea59df69843 MD5 | raw file
Possible License(s): Apache-2.0, BSD-3-Clause, JSON, CPL-1.0

Large files are truncated, but you can click here to view the full file

  1. PREHOOK: query: CREATE TABLE srcbucket_mapjoin(key int, value string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  2. PREHOOK: type: CREATETABLE
  3. POSTHOOK: query: CREATE TABLE srcbucket_mapjoin(key int, value string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  4. POSTHOOK: type: CREATETABLE
  5. POSTHOOK: Output: default@srcbucket_mapjoin
  6. PREHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin
  7. PREHOOK: type: LOAD
  8. POSTHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin
  9. POSTHOOK: type: LOAD
  10. POSTHOOK: Output: default@srcbucket_mapjoin
  11. PREHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin
  12. PREHOOK: type: LOAD
  13. POSTHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin
  14. POSTHOOK: type: LOAD
  15. POSTHOOK: Output: default@srcbucket_mapjoin
  16. PREHOOK: query: CREATE TABLE srcbucket_mapjoin_part (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 4 BUCKETS STORED AS TEXTFILE
  17. PREHOOK: type: CREATETABLE
  18. POSTHOOK: query: CREATE TABLE srcbucket_mapjoin_part (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 4 BUCKETS STORED AS TEXTFILE
  19. POSTHOOK: type: CREATETABLE
  20. POSTHOOK: Output: default@srcbucket_mapjoin_part
  21. PREHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  22. PREHOOK: type: LOAD
  23. POSTHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  24. POSTHOOK: type: LOAD
  25. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  26. PREHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  27. PREHOOK: type: LOAD
  28. POSTHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  29. POSTHOOK: type: LOAD
  30. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  31. PREHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  32. PREHOOK: type: LOAD
  33. POSTHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  34. POSTHOOK: type: LOAD
  35. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  36. PREHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  37. PREHOOK: type: LOAD
  38. POSTHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  39. POSTHOOK: type: LOAD
  40. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  41. PREHOOK: query: CREATE TABLE srcbucket_mapjoin_part_2 (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  42. PREHOOK: type: CREATETABLE
  43. POSTHOOK: query: CREATE TABLE srcbucket_mapjoin_part_2 (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  44. POSTHOOK: type: CREATETABLE
  45. POSTHOOK: Output: default@srcbucket_mapjoin_part_2
  46. PREHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  47. PREHOOK: type: LOAD
  48. POSTHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  49. POSTHOOK: type: LOAD
  50. POSTHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  51. PREHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  52. PREHOOK: type: LOAD
  53. POSTHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  54. POSTHOOK: type: LOAD
  55. POSTHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  56. PREHOOK: query: create table bucketmapjoin_hash_result_1 (key bigint , value1 bigint, value2 bigint)
  57. PREHOOK: type: CREATETABLE
  58. POSTHOOK: query: create table bucketmapjoin_hash_result_1 (key bigint , value1 bigint, value2 bigint)
  59. POSTHOOK: type: CREATETABLE
  60. POSTHOOK: Output: default@bucketmapjoin_hash_result_1
  61. PREHOOK: query: create table bucketmapjoin_hash_result_2 (key bigint , value1 bigint, value2 bigint)
  62. PREHOOK: type: CREATETABLE
  63. POSTHOOK: query: create table bucketmapjoin_hash_result_2 (key bigint , value1 bigint, value2 bigint)
  64. POSTHOOK: type: CREATETABLE
  65. POSTHOOK: Output: default@bucketmapjoin_hash_result_2
  66. PREHOOK: query: create table bucketmapjoin_tmp_result (key string , value1 string, value2 string)
  67. PREHOOK: type: CREATETABLE
  68. POSTHOOK: query: create table bucketmapjoin_tmp_result (key string , value1 string, value2 string)
  69. POSTHOOK: type: CREATETABLE
  70. POSTHOOK: Output: default@bucketmapjoin_tmp_result
  71. PREHOOK: query: explain extended
  72. insert overwrite table bucketmapjoin_tmp_result
  73. select /*+mapjoin(b)*/ a.key, a.value, b.value
  74. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  75. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  76. PREHOOK: type: QUERY
  77. POSTHOOK: query: explain extended
  78. insert overwrite table bucketmapjoin_tmp_result
  79. select /*+mapjoin(b)*/ a.key, a.value, b.value
  80. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  81. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  82. POSTHOOK: type: QUERY
  83. ABSTRACT SYNTAX TREE:
  84. (TOK_QUERY (TOK_FROM (TOK_JOIN (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin_part_2) a) (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin_part) b) (and (and (= (. (TOK_TABLE_OR_COL a) key) (. (TOK_TABLE_OR_COL b) key)) (= (. (TOK_TABLE_OR_COL b) ds) "2008-04-08")) (= (. (TOK_TABLE_OR_COL a) ds) "2008-04-08")))) (TOK_INSERT (TOK_DESTINATION (TOK_TAB (TOK_TABNAME bucketmapjoin_tmp_result))) (TOK_SELECT (TOK_HINTLIST (TOK_HINT TOK_MAPJOIN (TOK_HINTARGLIST b))) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) key)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) value)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL b) value)))))
  85. STAGE DEPENDENCIES:
  86. Stage-7 is a root stage
  87. Stage-1 depends on stages: Stage-7
  88. Stage-5 depends on stages: Stage-1 , consists of Stage-4, Stage-3
  89. Stage-4
  90. Stage-0 depends on stages: Stage-4, Stage-3
  91. Stage-2 depends on stages: Stage-0
  92. Stage-3
  93. STAGE PLANS:
  94. Stage: Stage-7
  95. Map Reduce Local Work
  96. Alias -> Map Local Tables:
  97. b
  98. Fetch Operator
  99. limit: -1
  100. Alias -> Map Local Operator Tree:
  101. b
  102. TableScan
  103. alias: b
  104. GatherStats: false
  105. Filter Operator
  106. isSamplingPred: false
  107. predicate:
  108. expr: (ds = '2008-04-08')
  109. type: boolean
  110. HashTable Sink Operator
  111. condition expressions:
  112. 0 {key} {value}
  113. 1 {value}
  114. handleSkewJoin: false
  115. keys:
  116. 0 [Column[key]]
  117. 1 [Column[key]]
  118. Position of Big Table: 0
  119. Bucket Mapjoin Context:
  120. Alias Bucket Base File Name Mapping:
  121. b {srcbucket22.txt=[srcbucket20.txt, srcbucket22.txt], srcbucket23.txt=[srcbucket21.txt, srcbucket23.txt]}
  122. Alias Bucket File Name Mapping:
  123. b {pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket22.txt=[pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket20.txt, pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket22.txt], pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket23.txt=[pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket21.txt, pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket23.txt]}
  124. Alias Bucket Output File Name Mapping:
  125. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket22.txt 0
  126. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket23.txt 1
  127. Stage: Stage-1
  128. Map Reduce
  129. Alias -> Map Operator Tree:
  130. a
  131. TableScan
  132. alias: a
  133. GatherStats: false
  134. Filter Operator
  135. isSamplingPred: false
  136. predicate:
  137. expr: (ds = '2008-04-08')
  138. type: boolean
  139. Map Join Operator
  140. condition map:
  141. Inner Join 0 to 1
  142. condition expressions:
  143. 0 {key} {value}
  144. 1 {value}
  145. handleSkewJoin: false
  146. keys:
  147. 0 [Column[key]]
  148. 1 [Column[key]]
  149. outputColumnNames: _col0, _col1, _col6
  150. Position of Big Table: 0
  151. Select Operator
  152. expressions:
  153. expr: _col0
  154. type: int
  155. expr: _col1
  156. type: string
  157. expr: _col6
  158. type: string
  159. outputColumnNames: _col0, _col1, _col6
  160. Select Operator
  161. expressions:
  162. expr: _col0
  163. type: int
  164. expr: _col1
  165. type: string
  166. expr: _col6
  167. type: string
  168. outputColumnNames: _col0, _col1, _col2
  169. File Output Operator
  170. compressed: false
  171. GlobalTableId: 1
  172. directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-34-44_204_2973712557284504853/-ext-10002
  173. NumFilesPerFileSink: 1
  174. Stats Publishing Key Prefix: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-34-44_204_2973712557284504853/-ext-10000/
  175. table:
  176. input format: org.apache.hadoop.mapred.TextInputFormat
  177. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  178. properties:
  179. bucket_count -1
  180. columns key,value1,value2
  181. columns.types string:string:string
  182. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  183. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  184. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  185. name default.bucketmapjoin_tmp_result
  186. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  187. serialization.format 1
  188. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  189. transient_lastDdlTime 1297330484
  190. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  191. name: default.bucketmapjoin_tmp_result
  192. TotalFiles: 1
  193. GatherStats: true
  194. MultiFileSpray: false
  195. Local Work:
  196. Map Reduce Local Work
  197. Needs Tagging: false
  198. Path -> Alias:
  199. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08 [a]
  200. Path -> Partition:
  201. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08
  202. Partition
  203. base file name: ds=2008-04-08
  204. input format: org.apache.hadoop.mapred.TextInputFormat
  205. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  206. partition values:
  207. ds 2008-04-08
  208. properties:
  209. bucket_count 2
  210. bucket_field_name key
  211. columns key,value
  212. columns.types int:string
  213. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  214. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  215. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08
  216. name default.srcbucket_mapjoin_part_2
  217. partition_columns ds
  218. serialization.ddl struct srcbucket_mapjoin_part_2 { i32 key, string value}
  219. serialization.format 1
  220. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  221. transient_lastDdlTime 1297330482
  222. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  223. input format: org.apache.hadoop.mapred.TextInputFormat
  224. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  225. properties:
  226. bucket_count 2
  227. bucket_field_name key
  228. columns key,value
  229. columns.types int:string
  230. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  231. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  232. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2
  233. name default.srcbucket_mapjoin_part_2
  234. partition_columns ds
  235. serialization.ddl struct srcbucket_mapjoin_part_2 { i32 key, string value}
  236. serialization.format 1
  237. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  238. transient_lastDdlTime 1297330482
  239. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  240. name: default.srcbucket_mapjoin_part_2
  241. name: default.srcbucket_mapjoin_part_2
  242. Stage: Stage-5
  243. Conditional Operator
  244. Stage: Stage-4
  245. Move Operator
  246. files:
  247. hdfs directory: true
  248. source: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-34-44_204_2973712557284504853/-ext-10002
  249. destination: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-34-44_204_2973712557284504853/-ext-10000
  250. Stage: Stage-0
  251. Move Operator
  252. tables:
  253. replace: true
  254. source: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-34-44_204_2973712557284504853/-ext-10000
  255. table:
  256. input format: org.apache.hadoop.mapred.TextInputFormat
  257. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  258. properties:
  259. bucket_count -1
  260. columns key,value1,value2
  261. columns.types string:string:string
  262. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  263. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  264. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  265. name default.bucketmapjoin_tmp_result
  266. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  267. serialization.format 1
  268. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  269. transient_lastDdlTime 1297330484
  270. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  271. name: default.bucketmapjoin_tmp_result
  272. tmp directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-34-44_204_2973712557284504853/-ext-10001
  273. Stage: Stage-2
  274. Stats-Aggr Operator
  275. Stats Aggregation Key Prefix: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-34-44_204_2973712557284504853/-ext-10000/
  276. Stage: Stage-3
  277. Map Reduce
  278. Alias -> Map Operator Tree:
  279. pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-34-44_204_2973712557284504853/-ext-10002
  280. File Output Operator
  281. compressed: false
  282. GlobalTableId: 0
  283. directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-34-44_204_2973712557284504853/-ext-10000
  284. NumFilesPerFileSink: 1
  285. table:
  286. input format: org.apache.hadoop.mapred.TextInputFormat
  287. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  288. properties:
  289. bucket_count -1
  290. columns key,value1,value2
  291. columns.types string:string:string
  292. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  293. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  294. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  295. name default.bucketmapjoin_tmp_result
  296. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  297. serialization.format 1
  298. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  299. transient_lastDdlTime 1297330484
  300. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  301. name: default.bucketmapjoin_tmp_result
  302. TotalFiles: 1
  303. GatherStats: false
  304. MultiFileSpray: false
  305. Needs Tagging: false
  306. Path -> Alias:
  307. pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-34-44_204_2973712557284504853/-ext-10002 [pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-34-44_204_2973712557284504853/-ext-10002]
  308. Path -> Partition:
  309. pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-34-44_204_2973712557284504853/-ext-10002
  310. Partition
  311. base file name: -ext-10002
  312. input format: org.apache.hadoop.mapred.TextInputFormat
  313. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  314. properties:
  315. bucket_count -1
  316. columns key,value1,value2
  317. columns.types string:string:string
  318. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  319. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  320. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  321. name default.bucketmapjoin_tmp_result
  322. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  323. serialization.format 1
  324. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  325. transient_lastDdlTime 1297330484
  326. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  327. input format: org.apache.hadoop.mapred.TextInputFormat
  328. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  329. properties:
  330. bucket_count -1
  331. columns key,value1,value2
  332. columns.types string:string:string
  333. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  334. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  335. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  336. name default.bucketmapjoin_tmp_result
  337. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  338. serialization.format 1
  339. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  340. transient_lastDdlTime 1297330484
  341. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  342. name: default.bucketmapjoin_tmp_result
  343. name: default.bucketmapjoin_tmp_result
  344. PREHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  345. select /*+mapjoin(b)*/ a.key, a.value, b.value
  346. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  347. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  348. PREHOOK: type: QUERY
  349. PREHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
  350. PREHOOK: Input: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  351. PREHOOK: Output: default@bucketmapjoin_tmp_result
  352. POSTHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  353. select /*+mapjoin(b)*/ a.key, a.value, b.value
  354. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  355. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  356. POSTHOOK: type: QUERY
  357. POSTHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
  358. POSTHOOK: Input: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  359. POSTHOOK: Output: default@bucketmapjoin_tmp_result
  360. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  361. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  362. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  363. PREHOOK: query: select count(1) from bucketmapjoin_tmp_result
  364. PREHOOK: type: QUERY
  365. PREHOOK: Input: default@bucketmapjoin_tmp_result
  366. PREHOOK: Output: file:/tmp/sdong/hive_2011-02-10_01-34-51_895_77836889145379095/-mr-10000
  367. POSTHOOK: query: select count(1) from bucketmapjoin_tmp_result
  368. POSTHOOK: type: QUERY
  369. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  370. POSTHOOK: Output: file:/tmp/sdong/hive_2011-02-10_01-34-51_895_77836889145379095/-mr-10000
  371. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  372. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  373. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  374. 564
  375. PREHOOK: query: insert overwrite table bucketmapjoin_hash_result_1
  376. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  377. PREHOOK: type: QUERY
  378. PREHOOK: Input: default@bucketmapjoin_tmp_result
  379. PREHOOK: Output: default@bucketmapjoin_hash_result_1
  380. POSTHOOK: query: insert overwrite table bucketmapjoin_hash_result_1
  381. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  382. POSTHOOK: type: QUERY
  383. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  384. POSTHOOK: Output: default@bucketmapjoin_hash_result_1
  385. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  386. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  387. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  388. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  389. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  390. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  391. PREHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  392. select /*+mapjoin(b)*/ a.key, a.value, b.value
  393. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  394. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  395. PREHOOK: type: QUERY
  396. PREHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
  397. PREHOOK: Input: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  398. PREHOOK: Output: default@bucketmapjoin_tmp_result
  399. POSTHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  400. select /*+mapjoin(b)*/ a.key, a.value, b.value
  401. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  402. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  403. POSTHOOK: type: QUERY
  404. POSTHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
  405. POSTHOOK: Input: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  406. POSTHOOK: Output: default@bucketmapjoin_tmp_result
  407. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  408. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  409. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  410. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  411. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  412. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  413. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  414. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  415. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  416. PREHOOK: query: select count(1) from bucketmapjoin_tmp_result
  417. PREHOOK: type: QUERY
  418. PREHOOK: Input: default@bucketmapjoin_tmp_result
  419. PREHOOK: Output: file:/tmp/sdong/hive_2011-02-10_01-35-06_716_6528981748204813247/-mr-10000
  420. POSTHOOK: query: select count(1) from bucketmapjoin_tmp_result
  421. POSTHOOK: type: QUERY
  422. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  423. POSTHOOK: Output: file:/tmp/sdong/hive_2011-02-10_01-35-06_716_6528981748204813247/-mr-10000
  424. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  425. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  426. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  427. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  428. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  429. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  430. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  431. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  432. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  433. 564
  434. PREHOOK: query: insert overwrite table bucketmapjoin_hash_result_2
  435. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  436. PREHOOK: type: QUERY
  437. PREHOOK: Input: default@bucketmapjoin_tmp_result
  438. PREHOOK: Output: default@bucketmapjoin_hash_result_2
  439. POSTHOOK: query: insert overwrite table bucketmapjoin_hash_result_2
  440. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  441. POSTHOOK: type: QUERY
  442. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  443. POSTHOOK: Output: default@bucketmapjoin_hash_result_2
  444. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  445. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  446. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  447. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  448. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  449. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  450. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  451. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  452. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  453. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  454. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  455. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  456. PREHOOK: query: select a.key-b.key, a.value1-b.value1, a.value2-b.value2
  457. from bucketmapjoin_hash_result_1 a left outer join bucketmapjoin_hash_result_2 b
  458. on a.key = b.key
  459. PREHOOK: type: QUERY
  460. PREHOOK: Input: default@bucketmapjoin_hash_result_1
  461. PREHOOK: Input: default@bucketmapjoin_hash_result_2
  462. PREHOOK: Output: file:/tmp/sdong/hive_2011-02-10_01-35-14_628_984622570724825210/-mr-10000
  463. POSTHOOK: query: select a.key-b.key, a.value1-b.value1, a.value2-b.value2
  464. from bucketmapjoin_hash_result_1 a left outer join bucketmapjoin_hash_result_2 b
  465. on a.key = b.key
  466. POSTHOOK: type: QUERY
  467. POSTHOOK: Input: default@bucketmapjoin_hash_result_1
  468. POSTHOOK: Input: default@bucketmapjoin_hash_result_2
  469. POSTHOOK: Output: file:/tmp/sdong/hive_2011-02-10_01-35-14_628_984622570724825210/-mr-10000
  470. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  471. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  472. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  473. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  474. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  475. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  476. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  477. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  478. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  479. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  480. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  481. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  482. 0 0 0
  483. PREHOOK: query: explain extended
  484. insert overwrite table bucketmapjoin_tmp_result
  485. select /*+mapjoin(a)*/ a.key, a.value, b.value
  486. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  487. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  488. PREHOOK: type: QUERY
  489. POSTHOOK: query: explain extended
  490. insert overwrite table bucketmapjoin_tmp_result
  491. select /*+mapjoin(a)*/ a.key, a.value, b.value
  492. from srcbucket_mapjoin_part_2 a join srcbucket_mapjoin_part b
  493. on a.key=b.key and b.ds="2008-04-08" and a.ds="2008-04-08"
  494. POSTHOOK: type: QUERY
  495. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  496. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  497. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  498. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  499. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  500. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  501. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  502. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:key, type:int, comment:null), ]
  503. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  504. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin_part_2)a.FieldSchema(name:value, type:string, comment:null), ]
  505. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  506. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  507. ABSTRACT SYNTAX TREE:
  508. (TOK_QUERY (TOK_FROM (TOK_JOIN (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin_part_2) a) (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin_part) b) (and (and (= (. (TOK_TABLE_OR_COL a) key) (. (TOK_TABLE_OR_COL b) key)) (= (. (TOK_TABLE_OR_COL b) ds) "2008-04-08")) (= (. (TOK_TABLE_OR_COL a) ds) "2008-04-08")))) (TOK_INSERT (TOK_DESTINATION (TOK_TAB (TOK_TABNAME bucketmapjoin_tmp_result))) (TOK_SELECT (TOK_HINTLIST (TOK_HINT TOK_MAPJOIN (TOK_HINTARGLIST a))) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) key)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) value)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL b) value)))))
  509. STAGE DEPENDENCIES:
  510. Stage-7 is a root stage
  511. Stage-1 depends on stages: Stage-7
  512. Stage-5 depends on stages: Stage-1 , consists of Stage-4, Stage-3
  513. Stage-4
  514. Stage-0 depends on stages: Stage-4, Stage-3
  515. Stage-2 depends on stages: Stage-0
  516. Stage-3
  517. STAGE PLANS:
  518. Stage: Stage-7
  519. Map Reduce Local Work
  520. Alias -> Map Local Tables:
  521. a
  522. Fetch Operator
  523. limit: -1
  524. Alias -> Map Local Operator Tree:
  525. a
  526. TableScan
  527. alias: a
  528. GatherStats: false
  529. Filter Operator
  530. isSamplingPred: false
  531. predicate:
  532. expr: (ds = '2008-04-08')
  533. type: boolean
  534. HashTable Sink Operator
  535. condition expressions:
  536. 0 {key} {value}
  537. 1 {value}
  538. handleSkewJoin: false
  539. keys:
  540. 0 [Column[key]]
  541. 1 [Column[key]]
  542. Position of Big Table: 1
  543. Bucket Mapjoin Context:
  544. Alias Bucket Base File Name Mapping:
  545. a {srcbucket20.txt=[srcbucket22.txt], srcbucket21.txt=[srcbucket23.txt], srcbucket22.txt=[srcbucket22.txt], srcbucket23.txt=[srcbucket23.txt]}
  546. Alias Bucket File Name Mapping:
  547. a {pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket20.txt=[pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket22.txt], pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket21.txt=[pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket23.txt], pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket22.txt=[pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket22.txt], pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket23.txt=[pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part_2/ds=2008-04-08/srcbucket23.txt]}
  548. Alias Bucket Output File Name Mapping:
  549. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket20.txt 0
  550. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket21.txt 1
  551. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket22.txt 2
  552. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket23.txt 3
  553. Stage: Stage-1
  554. Map Reduce
  555. Alias -> Map Operator Tree:
  556. b
  557. TableScan
  558. alias: b
  559. GatherStats: false
  560. Filter Operator
  561. isSamplingPred: false
  562. predicate:
  563. expr: (ds = '2008-04-08')
  564. type: boolean
  565. Map Join Operator
  566. condition map:
  567. Inner Join 0 to 1
  568. condition expressions:
  569. 0 {key} {value}
  570. 1 {value}
  571. handleSkewJoin: false
  572. keys:
  573. 0 [Column[key]]
  574. 1 [Column[key]]
  575. outputColumnNames: _col0, _col1, _col6
  576. Position of Big Table: 1
  577. Select Operator
  578. expressions:
  579. expr: _col0
  580. type: int
  581. expr: _col1
  582. type: string
  583. expr: _col6
  584. type: string
  585. outputColumnNames: _col0, _col1, _col6
  586. Select Operator
  587. expressions:
  588. expr: _col0
  589. type: int
  590. expr: _col1
  591. type: string
  592. expr: _col6
  593. type: string
  594. outputColumnNames: _col0, _col1, _col2
  595. File Output Operator
  596. compressed: false
  597. GlobalTableId: 1
  598. directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-35-18_368_6277373757642429866/-ext-10002
  599. NumFilesPerFileSink: 1
  600. Stats Publishing Key Prefix: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-35-18_368_6277373757642429866/-ext-10000/
  601. table:
  602. input format: org.apache.hadoop.mapred.TextInputFormat
  603. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  604. properties:
  605. bucket_count -1
  606. columns key,value1,value2
  607. columns.types string:string:string
  608. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  609. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  610. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  611. name default.bucketmapjoin_tmp_result
  612. numFiles 1
  613. numPartitions 0
  614. numRows 564
  615. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  616. serialization.format 1
  617. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  618. totalSize 11067
  619. transient_lastDdlTime 1297330506
  620. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  621. name: default.bucketmapjoin_tmp_result
  622. TotalFiles: 1
  623. GatherStats: true
  624. MultiFileSpray: false
  625. Local Work:
  626. Map Reduce Local Work
  627. Needs Tagging: false
  628. Path -> Alias:
  629. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08 [b]
  630. Path -> Partition:
  631. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08
  632. Partition
  633. base file name: ds=2008-04-08
  634. input format: org.apache.hadoop.mapred.TextInputFormat
  635. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  636. partition values:
  637. ds 2008-04-08
  638. properties:
  639. bucket_count 4
  640. bucket_field_name key
  641. columns key,value
  642. columns.types int:string
  643. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  644. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  645. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08
  646. name default.srcbucket_mapjoin_part
  647. partition_columns ds
  648. serialization.ddl struct srcbucket_mapjoin_part { i32 key, string value}
  649. serialization.format 1
  650. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  651. transient_lastDdlTime 1297330480
  652. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  653. input format: org.apache.hadoop.mapred.TextInputFormat
  654. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  655. properties:
  656. bucket_count 4
  657. bucket_field_name key
  658. columns key,value
  659. columns.types int:string
  660. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  661. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  662. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part
  663. name default.srcbucket_mapjoin_part
  664. partition_columns ds
  665. serialization.ddl struct srcbucket_mapjoin_part { i32 key, string value}
  666. serialization.format 1
  667. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  668. transient_lastDdlTime 1297330480
  669. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  670. name: default.srcbucket_mapjoin_part
  671. name: default.srcbucket_mapjoin_part
  672. Stage: Stage-5
  673. Conditional Operator
  674. Stage: Stage-4
  675. Move Operator
  676. files:
  677. hdfs directory: true
  678. source: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-35-18_368_6277373757642429866/-ext-10002
  679. destination: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-35-18_368_6277373757642429866/-ext-10000
  680. Stage: Stage-0
  681. Move Operator
  682. tables:
  683. replace: true
  684. source: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-35-18_368_6277373757642429866/-ext-10000
  685. table:
  686. input format: org.apache.hadoop.mapred.TextInputFormat
  687. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  688. properties:
  689. bucket_count -1
  690. columns key,value1,value2
  691. columns.types string:string:string
  692. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  693. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  694. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  695. name default.bucketmapjoin_tmp_result
  696. numFiles 1
  697. numPartitions 0
  698. numRows 564
  699. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  700. serialization.format 1
  701. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  702. totalSize 11067
  703. transient_lastDdlTime 1297330506
  704. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  705. name: default.bucketmapjoin_tmp_result
  706. tmp directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-35-18_368_6277373757642429866/-ext-10001
  707. Stage: Stage-2
  708. Stats-Aggr Operator
  709. Stats Aggregation Key Prefix: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-35-18_368_6277373757642429866/-ext-10000/
  710. Stage: Stage-3
  711. Map Reduce
  712. Alias -> Map Operator Tree:
  713. pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-35-18_368_6277373757642429866/-ext-10002
  714. File Output Operator
  715. compressed: false
  716. GlobalTableId: 0
  717. directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-35-18_368_6277373757642429866/-ext-10000
  718. NumFilesPerFileSink: 1
  719. table:
  720. input format: org.apache.hadoop.mapred.TextInputFormat
  721. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  722. properties:
  723. bucket_count -1
  724. columns key,value1,value2
  725. columns.types string:string:string
  726. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  727. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  728. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  729. name default.bucketmapjoin_tmp_result
  730. numFiles 1
  731. numPartitions 0
  732. numRows 564
  733. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  734. serialization.format 1
  735. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  736. totalSize 11067
  737. transient_lastDdlTime 1297330506
  738. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  739. name: default.bucketmapjoin_tmp_result
  740. TotalFiles: 1
  741. GatherStats: false
  742. MultiFileSpray: false
  743. Needs Tagging: false
  744. Path -> Alias:
  745. pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-35-18_368_6277373757642429866/-ext-10002 [pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-35-18_368_

Large files files are truncated, but you can click here to view the full file