PageRenderTime 51ms CodeModel.GetById 22ms RepoModel.GetById 0ms app.codeStats 0ms

/tags/release-0.0.0-rc0/hive/external/ql/src/test/results/clientpositive/bucketmapjoin1.q.out

#
text | 1026 lines | 1002 code | 24 blank | 0 comment | 0 complexity | 4f95c8fa54aebc315fabccc2b9bf42c1 MD5 | raw file
Possible License(s): Apache-2.0, BSD-3-Clause, JSON, CPL-1.0

Large files are truncated, but you can click here to view the full file

  1. PREHOOK: query: CREATE TABLE srcbucket_mapjoin(key int, value string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  2. PREHOOK: type: CREATETABLE
  3. POSTHOOK: query: CREATE TABLE srcbucket_mapjoin(key int, value string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  4. POSTHOOK: type: CREATETABLE
  5. POSTHOOK: Output: default@srcbucket_mapjoin
  6. PREHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin
  7. PREHOOK: type: LOAD
  8. POSTHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin
  9. POSTHOOK: type: LOAD
  10. POSTHOOK: Output: default@srcbucket_mapjoin
  11. PREHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin
  12. PREHOOK: type: LOAD
  13. POSTHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin
  14. POSTHOOK: type: LOAD
  15. POSTHOOK: Output: default@srcbucket_mapjoin
  16. PREHOOK: query: CREATE TABLE srcbucket_mapjoin_part (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 4 BUCKETS STORED AS TEXTFILE
  17. PREHOOK: type: CREATETABLE
  18. POSTHOOK: query: CREATE TABLE srcbucket_mapjoin_part (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 4 BUCKETS STORED AS TEXTFILE
  19. POSTHOOK: type: CREATETABLE
  20. POSTHOOK: Output: default@srcbucket_mapjoin_part
  21. PREHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  22. PREHOOK: type: LOAD
  23. POSTHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  24. POSTHOOK: type: LOAD
  25. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  26. PREHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  27. PREHOOK: type: LOAD
  28. POSTHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  29. POSTHOOK: type: LOAD
  30. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  31. PREHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  32. PREHOOK: type: LOAD
  33. POSTHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  34. POSTHOOK: type: LOAD
  35. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  36. PREHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  37. PREHOOK: type: LOAD
  38. POSTHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  39. POSTHOOK: type: LOAD
  40. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  41. PREHOOK: query: CREATE TABLE srcbucket_mapjoin_part_2 (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  42. PREHOOK: type: CREATETABLE
  43. POSTHOOK: query: CREATE TABLE srcbucket_mapjoin_part_2 (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  44. POSTHOOK: type: CREATETABLE
  45. POSTHOOK: Output: default@srcbucket_mapjoin_part_2
  46. PREHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  47. PREHOOK: type: LOAD
  48. POSTHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  49. POSTHOOK: type: LOAD
  50. POSTHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  51. PREHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  52. PREHOOK: type: LOAD
  53. POSTHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  54. POSTHOOK: type: LOAD
  55. POSTHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  56. PREHOOK: query: create table bucketmapjoin_hash_result_1 (key bigint , value1 bigint, value2 bigint)
  57. PREHOOK: type: CREATETABLE
  58. POSTHOOK: query: create table bucketmapjoin_hash_result_1 (key bigint , value1 bigint, value2 bigint)
  59. POSTHOOK: type: CREATETABLE
  60. POSTHOOK: Output: default@bucketmapjoin_hash_result_1
  61. PREHOOK: query: create table bucketmapjoin_hash_result_2 (key bigint , value1 bigint, value2 bigint)
  62. PREHOOK: type: CREATETABLE
  63. POSTHOOK: query: create table bucketmapjoin_hash_result_2 (key bigint , value1 bigint, value2 bigint)
  64. POSTHOOK: type: CREATETABLE
  65. POSTHOOK: Output: default@bucketmapjoin_hash_result_2
  66. PREHOOK: query: create table bucketmapjoin_tmp_result (key string , value1 string, value2 string)
  67. PREHOOK: type: CREATETABLE
  68. POSTHOOK: query: create table bucketmapjoin_tmp_result (key string , value1 string, value2 string)
  69. POSTHOOK: type: CREATETABLE
  70. POSTHOOK: Output: default@bucketmapjoin_tmp_result
  71. PREHOOK: query: explain extended
  72. insert overwrite table bucketmapjoin_tmp_result
  73. select /*+mapjoin(b)*/ a.key, a.value, b.value
  74. from srcbucket_mapjoin a join srcbucket_mapjoin_part b
  75. on a.key=b.key where b.ds="2008-04-08"
  76. PREHOOK: type: QUERY
  77. POSTHOOK: query: explain extended
  78. insert overwrite table bucketmapjoin_tmp_result
  79. select /*+mapjoin(b)*/ a.key, a.value, b.value
  80. from srcbucket_mapjoin a join srcbucket_mapjoin_part b
  81. on a.key=b.key where b.ds="2008-04-08"
  82. POSTHOOK: type: QUERY
  83. ABSTRACT SYNTAX TREE:
  84. (TOK_QUERY (TOK_FROM (TOK_JOIN (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin) a) (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin_part) b) (= (. (TOK_TABLE_OR_COL a) key) (. (TOK_TABLE_OR_COL b) key)))) (TOK_INSERT (TOK_DESTINATION (TOK_TAB (TOK_TABNAME bucketmapjoin_tmp_result))) (TOK_SELECT (TOK_HINTLIST (TOK_HINT TOK_MAPJOIN (TOK_HINTARGLIST b))) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) key)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) value)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL b) value))) (TOK_WHERE (= (. (TOK_TABLE_OR_COL b) ds) "2008-04-08"))))
  85. STAGE DEPENDENCIES:
  86. Stage-7 is a root stage
  87. Stage-1 depends on stages: Stage-7
  88. Stage-5 depends on stages: Stage-1 , consists of Stage-4, Stage-3
  89. Stage-4
  90. Stage-0 depends on stages: Stage-4, Stage-3
  91. Stage-2 depends on stages: Stage-0
  92. Stage-3
  93. STAGE PLANS:
  94. Stage: Stage-7
  95. Map Reduce Local Work
  96. Alias -> Map Local Tables:
  97. b
  98. Fetch Operator
  99. limit: -1
  100. Alias -> Map Local Operator Tree:
  101. b
  102. TableScan
  103. alias: b
  104. GatherStats: false
  105. HashTable Sink Operator
  106. condition expressions:
  107. 0 {key} {value}
  108. 1 {value} {ds}
  109. handleSkewJoin: false
  110. keys:
  111. 0 [Column[key]]
  112. 1 [Column[key]]
  113. Position of Big Table: 0
  114. Bucket Mapjoin Context:
  115. Alias Bucket Base File Name Mapping:
  116. b {srcbucket20.txt=[srcbucket20.txt, srcbucket22.txt], srcbucket21.txt=[srcbucket21.txt, srcbucket23.txt]}
  117. Alias Bucket File Name Mapping:
  118. b {pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt=[pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket20.txt, pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket22.txt], pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt=[pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket21.txt, pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket23.txt]}
  119. Alias Bucket Output File Name Mapping:
  120. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt 0
  121. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt 1
  122. Stage: Stage-1
  123. Map Reduce
  124. Alias -> Map Operator Tree:
  125. a
  126. TableScan
  127. alias: a
  128. GatherStats: false
  129. Map Join Operator
  130. condition map:
  131. Inner Join 0 to 1
  132. condition expressions:
  133. 0 {key} {value}
  134. 1 {value} {ds}
  135. handleSkewJoin: false
  136. keys:
  137. 0 [Column[key]]
  138. 1 [Column[key]]
  139. outputColumnNames: _col0, _col1, _col5, _col6
  140. Position of Big Table: 0
  141. Select Operator
  142. expressions:
  143. expr: _col0
  144. type: int
  145. expr: _col1
  146. type: string
  147. expr: _col5
  148. type: string
  149. expr: _col6
  150. type: string
  151. outputColumnNames: _col0, _col1, _col5, _col6
  152. Filter Operator
  153. isSamplingPred: false
  154. predicate:
  155. expr: (_col6 = '2008-04-08')
  156. type: boolean
  157. Select Operator
  158. expressions:
  159. expr: _col0
  160. type: int
  161. expr: _col1
  162. type: string
  163. expr: _col5
  164. type: string
  165. outputColumnNames: _col0, _col1, _col2
  166. File Output Operator
  167. compressed: false
  168. GlobalTableId: 1
  169. directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-14_620_3045094958113552377/-ext-10002
  170. NumFilesPerFileSink: 1
  171. Stats Publishing Key Prefix: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-14_620_3045094958113552377/-ext-10000/
  172. table:
  173. input format: org.apache.hadoop.mapred.TextInputFormat
  174. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  175. properties:
  176. bucket_count -1
  177. columns key,value1,value2
  178. columns.types string:string:string
  179. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  180. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  181. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  182. name default.bucketmapjoin_tmp_result
  183. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  184. serialization.format 1
  185. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  186. transient_lastDdlTime 1297330334
  187. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  188. name: default.bucketmapjoin_tmp_result
  189. TotalFiles: 1
  190. GatherStats: true
  191. MultiFileSpray: false
  192. Local Work:
  193. Map Reduce Local Work
  194. Needs Tagging: false
  195. Path -> Alias:
  196. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin [a]
  197. Path -> Partition:
  198. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin
  199. Partition
  200. base file name: srcbucket_mapjoin
  201. input format: org.apache.hadoop.mapred.TextInputFormat
  202. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  203. properties:
  204. bucket_count 2
  205. bucket_field_name key
  206. columns key,value
  207. columns.types int:string
  208. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  209. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  210. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin
  211. name default.srcbucket_mapjoin
  212. serialization.ddl struct srcbucket_mapjoin { i32 key, string value}
  213. serialization.format 1
  214. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  215. transient_lastDdlTime 1297330330
  216. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  217. input format: org.apache.hadoop.mapred.TextInputFormat
  218. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  219. properties:
  220. bucket_count 2
  221. bucket_field_name key
  222. columns key,value
  223. columns.types int:string
  224. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  225. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  226. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin
  227. name default.srcbucket_mapjoin
  228. serialization.ddl struct srcbucket_mapjoin { i32 key, string value}
  229. serialization.format 1
  230. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  231. transient_lastDdlTime 1297330330
  232. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  233. name: default.srcbucket_mapjoin
  234. name: default.srcbucket_mapjoin
  235. Stage: Stage-5
  236. Conditional Operator
  237. Stage: Stage-4
  238. Move Operator
  239. files:
  240. hdfs directory: true
  241. source: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-14_620_3045094958113552377/-ext-10002
  242. destination: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-14_620_3045094958113552377/-ext-10000
  243. Stage: Stage-0
  244. Move Operator
  245. tables:
  246. replace: true
  247. source: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-14_620_3045094958113552377/-ext-10000
  248. table:
  249. input format: org.apache.hadoop.mapred.TextInputFormat
  250. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  251. properties:
  252. bucket_count -1
  253. columns key,value1,value2
  254. columns.types string:string:string
  255. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  256. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  257. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  258. name default.bucketmapjoin_tmp_result
  259. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  260. serialization.format 1
  261. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  262. transient_lastDdlTime 1297330334
  263. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  264. name: default.bucketmapjoin_tmp_result
  265. tmp directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-14_620_3045094958113552377/-ext-10001
  266. Stage: Stage-2
  267. Stats-Aggr Operator
  268. Stats Aggregation Key Prefix: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-14_620_3045094958113552377/-ext-10000/
  269. Stage: Stage-3
  270. Map Reduce
  271. Alias -> Map Operator Tree:
  272. pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-14_620_3045094958113552377/-ext-10002
  273. File Output Operator
  274. compressed: false
  275. GlobalTableId: 0
  276. directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-14_620_3045094958113552377/-ext-10000
  277. NumFilesPerFileSink: 1
  278. table:
  279. input format: org.apache.hadoop.mapred.TextInputFormat
  280. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  281. properties:
  282. bucket_count -1
  283. columns key,value1,value2
  284. columns.types string:string:string
  285. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  286. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  287. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  288. name default.bucketmapjoin_tmp_result
  289. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  290. serialization.format 1
  291. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  292. transient_lastDdlTime 1297330334
  293. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  294. name: default.bucketmapjoin_tmp_result
  295. TotalFiles: 1
  296. GatherStats: false
  297. MultiFileSpray: false
  298. Needs Tagging: false
  299. Path -> Alias:
  300. pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-14_620_3045094958113552377/-ext-10002 [pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-14_620_3045094958113552377/-ext-10002]
  301. Path -> Partition:
  302. pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-14_620_3045094958113552377/-ext-10002
  303. Partition
  304. base file name: -ext-10002
  305. input format: org.apache.hadoop.mapred.TextInputFormat
  306. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  307. properties:
  308. bucket_count -1
  309. columns key,value1,value2
  310. columns.types string:string:string
  311. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  312. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  313. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  314. name default.bucketmapjoin_tmp_result
  315. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  316. serialization.format 1
  317. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  318. transient_lastDdlTime 1297330334
  319. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  320. input format: org.apache.hadoop.mapred.TextInputFormat
  321. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  322. properties:
  323. bucket_count -1
  324. columns key,value1,value2
  325. columns.types string:string:string
  326. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  327. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  328. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  329. name default.bucketmapjoin_tmp_result
  330. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  331. serialization.format 1
  332. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  333. transient_lastDdlTime 1297330334
  334. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  335. name: default.bucketmapjoin_tmp_result
  336. name: default.bucketmapjoin_tmp_result
  337. PREHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  338. select /*+mapjoin(b)*/ a.key, a.value, b.value
  339. from srcbucket_mapjoin a join srcbucket_mapjoin_part b
  340. on a.key=b.key where b.ds="2008-04-08"
  341. PREHOOK: type: QUERY
  342. PREHOOK: Input: default@srcbucket_mapjoin
  343. PREHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
  344. PREHOOK: Output: default@bucketmapjoin_tmp_result
  345. POSTHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  346. select /*+mapjoin(b)*/ a.key, a.value, b.value
  347. from srcbucket_mapjoin a join srcbucket_mapjoin_part b
  348. on a.key=b.key where b.ds="2008-04-08"
  349. POSTHOOK: type: QUERY
  350. POSTHOOK: Input: default@srcbucket_mapjoin
  351. POSTHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
  352. POSTHOOK: Output: default@bucketmapjoin_tmp_result
  353. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  354. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  355. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  356. PREHOOK: query: select count(1) from bucketmapjoin_tmp_result
  357. PREHOOK: type: QUERY
  358. PREHOOK: Input: default@bucketmapjoin_tmp_result
  359. PREHOOK: Output: file:/tmp/sdong/hive_2011-02-10_01-32-22_115_3370231433781185993/-mr-10000
  360. POSTHOOK: query: select count(1) from bucketmapjoin_tmp_result
  361. POSTHOOK: type: QUERY
  362. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  363. POSTHOOK: Output: file:/tmp/sdong/hive_2011-02-10_01-32-22_115_3370231433781185993/-mr-10000
  364. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  365. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  366. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  367. 464
  368. PREHOOK: query: insert overwrite table bucketmapjoin_hash_result_1
  369. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  370. PREHOOK: type: QUERY
  371. PREHOOK: Input: default@bucketmapjoin_tmp_result
  372. PREHOOK: Output: default@bucketmapjoin_hash_result_1
  373. POSTHOOK: query: insert overwrite table bucketmapjoin_hash_result_1
  374. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  375. POSTHOOK: type: QUERY
  376. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  377. POSTHOOK: Output: default@bucketmapjoin_hash_result_1
  378. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  379. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  380. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  381. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  382. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  383. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  384. PREHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  385. select /*+mapjoin(b)*/ a.key, a.value, b.value
  386. from srcbucket_mapjoin a join srcbucket_mapjoin_part b
  387. on a.key=b.key where b.ds="2008-04-08"
  388. PREHOOK: type: QUERY
  389. PREHOOK: Input: default@srcbucket_mapjoin
  390. PREHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
  391. PREHOOK: Output: default@bucketmapjoin_tmp_result
  392. POSTHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  393. select /*+mapjoin(b)*/ a.key, a.value, b.value
  394. from srcbucket_mapjoin a join srcbucket_mapjoin_part b
  395. on a.key=b.key where b.ds="2008-04-08"
  396. POSTHOOK: type: QUERY
  397. POSTHOOK: Input: default@srcbucket_mapjoin
  398. POSTHOOK: Input: default@srcbucket_mapjoin_part@ds=2008-04-08
  399. POSTHOOK: Output: default@bucketmapjoin_tmp_result
  400. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  401. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  402. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  403. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  404. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  405. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  406. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  407. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  408. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  409. PREHOOK: query: select count(1) from bucketmapjoin_tmp_result
  410. PREHOOK: type: QUERY
  411. PREHOOK: Input: default@bucketmapjoin_tmp_result
  412. PREHOOK: Output: file:/tmp/sdong/hive_2011-02-10_01-32-36_794_2065549773611334726/-mr-10000
  413. POSTHOOK: query: select count(1) from bucketmapjoin_tmp_result
  414. POSTHOOK: type: QUERY
  415. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  416. POSTHOOK: Output: file:/tmp/sdong/hive_2011-02-10_01-32-36_794_2065549773611334726/-mr-10000
  417. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  418. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  419. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  420. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  421. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  422. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  423. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  424. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  425. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  426. 464
  427. PREHOOK: query: insert overwrite table bucketmapjoin_hash_result_2
  428. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  429. PREHOOK: type: QUERY
  430. PREHOOK: Input: default@bucketmapjoin_tmp_result
  431. PREHOOK: Output: default@bucketmapjoin_hash_result_2
  432. POSTHOOK: query: insert overwrite table bucketmapjoin_hash_result_2
  433. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  434. POSTHOOK: type: QUERY
  435. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  436. POSTHOOK: Output: default@bucketmapjoin_hash_result_2
  437. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  438. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  439. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  440. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  441. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  442. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  443. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  444. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  445. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  446. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  447. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  448. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  449. PREHOOK: query: select a.key-b.key, a.value1-b.value1, a.value2-b.value2
  450. from bucketmapjoin_hash_result_1 a left outer join bucketmapjoin_hash_result_2 b
  451. on a.key = b.key
  452. PREHOOK: type: QUERY
  453. PREHOOK: Input: default@bucketmapjoin_hash_result_1
  454. PREHOOK: Input: default@bucketmapjoin_hash_result_2
  455. PREHOOK: Output: file:/tmp/sdong/hive_2011-02-10_01-32-44_744_7341074953851265954/-mr-10000
  456. POSTHOOK: query: select a.key-b.key, a.value1-b.value1, a.value2-b.value2
  457. from bucketmapjoin_hash_result_1 a left outer join bucketmapjoin_hash_result_2 b
  458. on a.key = b.key
  459. POSTHOOK: type: QUERY
  460. POSTHOOK: Input: default@bucketmapjoin_hash_result_1
  461. POSTHOOK: Input: default@bucketmapjoin_hash_result_2
  462. POSTHOOK: Output: file:/tmp/sdong/hive_2011-02-10_01-32-44_744_7341074953851265954/-mr-10000
  463. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  464. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  465. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  466. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  467. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  468. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  469. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  470. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  471. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  472. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  473. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  474. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  475. 0 0 0
  476. PREHOOK: query: explain extended
  477. insert overwrite table bucketmapjoin_tmp_result
  478. select /*+mapjoin(a)*/ a.key, a.value, b.value
  479. from srcbucket_mapjoin a join srcbucket_mapjoin_part b
  480. on a.key=b.key where b.ds="2008-04-08"
  481. PREHOOK: type: QUERY
  482. POSTHOOK: query: explain extended
  483. insert overwrite table bucketmapjoin_tmp_result
  484. select /*+mapjoin(a)*/ a.key, a.value, b.value
  485. from srcbucket_mapjoin a join srcbucket_mapjoin_part b
  486. on a.key=b.key where b.ds="2008-04-08"
  487. POSTHOOK: type: QUERY
  488. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  489. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  490. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  491. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  492. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  493. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  494. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  495. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  496. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  497. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  498. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  499. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin_part)b.FieldSchema(name:value, type:string, comment:null), ]
  500. ABSTRACT SYNTAX TREE:
  501. (TOK_QUERY (TOK_FROM (TOK_JOIN (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin) a) (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin_part) b) (= (. (TOK_TABLE_OR_COL a) key) (. (TOK_TABLE_OR_COL b) key)))) (TOK_INSERT (TOK_DESTINATION (TOK_TAB (TOK_TABNAME bucketmapjoin_tmp_result))) (TOK_SELECT (TOK_HINTLIST (TOK_HINT TOK_MAPJOIN (TOK_HINTARGLIST a))) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) key)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) value)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL b) value))) (TOK_WHERE (= (. (TOK_TABLE_OR_COL b) ds) "2008-04-08"))))
  502. STAGE DEPENDENCIES:
  503. Stage-7 is a root stage
  504. Stage-1 depends on stages: Stage-7
  505. Stage-5 depends on stages: Stage-1 , consists of Stage-4, Stage-3
  506. Stage-4
  507. Stage-0 depends on stages: Stage-4, Stage-3
  508. Stage-2 depends on stages: Stage-0
  509. Stage-3
  510. STAGE PLANS:
  511. Stage: Stage-7
  512. Map Reduce Local Work
  513. Alias -> Map Local Tables:
  514. a
  515. Fetch Operator
  516. limit: -1
  517. Alias -> Map Local Operator Tree:
  518. a
  519. TableScan
  520. alias: a
  521. GatherStats: false
  522. HashTable Sink Operator
  523. condition expressions:
  524. 0 {key} {value}
  525. 1 {value} {ds}
  526. handleSkewJoin: false
  527. keys:
  528. 0 [Column[key]]
  529. 1 [Column[key]]
  530. Position of Big Table: 1
  531. Bucket Mapjoin Context:
  532. Alias Bucket Base File Name Mapping:
  533. a {srcbucket20.txt=[srcbucket20.txt], srcbucket21.txt=[srcbucket21.txt], srcbucket22.txt=[srcbucket20.txt], srcbucket23.txt=[srcbucket21.txt]}
  534. Alias Bucket File Name Mapping:
  535. a {pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket20.txt=[pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt], pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket21.txt=[pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt], pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket22.txt=[pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt], pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket23.txt=[pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt]}
  536. Alias Bucket Output File Name Mapping:
  537. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket20.txt 0
  538. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket21.txt 1
  539. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket22.txt 2
  540. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08/srcbucket23.txt 3
  541. Stage: Stage-1
  542. Map Reduce
  543. Alias -> Map Operator Tree:
  544. b
  545. TableScan
  546. alias: b
  547. GatherStats: false
  548. Map Join Operator
  549. condition map:
  550. Inner Join 0 to 1
  551. condition expressions:
  552. 0 {key} {value}
  553. 1 {value} {ds}
  554. handleSkewJoin: false
  555. keys:
  556. 0 [Column[key]]
  557. 1 [Column[key]]
  558. outputColumnNames: _col0, _col1, _col5, _col6
  559. Position of Big Table: 1
  560. Select Operator
  561. expressions:
  562. expr: _col0
  563. type: int
  564. expr: _col1
  565. type: string
  566. expr: _col5
  567. type: string
  568. expr: _col6
  569. type: string
  570. outputColumnNames: _col0, _col1, _col5, _col6
  571. Filter Operator
  572. isSamplingPred: false
  573. predicate:
  574. expr: (_col6 = '2008-04-08')
  575. type: boolean
  576. Select Operator
  577. expressions:
  578. expr: _col0
  579. type: int
  580. expr: _col1
  581. type: string
  582. expr: _col5
  583. type: string
  584. outputColumnNames: _col0, _col1, _col2
  585. File Output Operator
  586. compressed: false
  587. GlobalTableId: 1
  588. directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-48_438_2652635181723360989/-ext-10002
  589. NumFilesPerFileSink: 1
  590. Stats Publishing Key Prefix: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-48_438_2652635181723360989/-ext-10000/
  591. table:
  592. input format: org.apache.hadoop.mapred.TextInputFormat
  593. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  594. properties:
  595. bucket_count -1
  596. columns key,value1,value2
  597. columns.types string:string:string
  598. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  599. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  600. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  601. name default.bucketmapjoin_tmp_result
  602. numFiles 1
  603. numPartitions 0
  604. numRows 464
  605. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  606. serialization.format 1
  607. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  608. totalSize 8983
  609. transient_lastDdlTime 1297330356
  610. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  611. name: default.bucketmapjoin_tmp_result
  612. TotalFiles: 1
  613. GatherStats: true
  614. MultiFileSpray: false
  615. Local Work:
  616. Map Reduce Local Work
  617. Needs Tagging: false
  618. Path -> Alias:
  619. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08 [b]
  620. Path -> Partition:
  621. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08
  622. Partition
  623. base file name: ds=2008-04-08
  624. input format: org.apache.hadoop.mapred.TextInputFormat
  625. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  626. partition values:
  627. ds 2008-04-08
  628. properties:
  629. bucket_count 4
  630. bucket_field_name key
  631. columns key,value
  632. columns.types int:string
  633. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  634. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  635. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part/ds=2008-04-08
  636. name default.srcbucket_mapjoin_part
  637. partition_columns ds
  638. serialization.ddl struct srcbucket_mapjoin_part { i32 key, string value}
  639. serialization.format 1
  640. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  641. transient_lastDdlTime 1297330330
  642. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  643. input format: org.apache.hadoop.mapred.TextInputFormat
  644. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  645. properties:
  646. bucket_count 4
  647. bucket_field_name key
  648. columns key,value
  649. columns.types int:string
  650. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  651. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  652. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/srcbucket_mapjoin_part
  653. name default.srcbucket_mapjoin_part
  654. partition_columns ds
  655. serialization.ddl struct srcbucket_mapjoin_part { i32 key, string value}
  656. serialization.format 1
  657. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  658. transient_lastDdlTime 1297330330
  659. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  660. name: default.srcbucket_mapjoin_part
  661. name: default.srcbucket_mapjoin_part
  662. Stage: Stage-5
  663. Conditional Operator
  664. Stage: Stage-4
  665. Move Operator
  666. files:
  667. hdfs directory: true
  668. source: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-48_438_2652635181723360989/-ext-10002
  669. destination: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-48_438_2652635181723360989/-ext-10000
  670. Stage: Stage-0
  671. Move Operator
  672. tables:
  673. replace: true
  674. source: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-48_438_2652635181723360989/-ext-10000
  675. table:
  676. input format: org.apache.hadoop.mapred.TextInputFormat
  677. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  678. properties:
  679. bucket_count -1
  680. columns key,value1,value2
  681. columns.types string:string:string
  682. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  683. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  684. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  685. name default.bucketmapjoin_tmp_result
  686. numFiles 1
  687. numPartitions 0
  688. numRows 464
  689. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  690. serialization.format 1
  691. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  692. totalSize 8983
  693. transient_lastDdlTime 1297330356
  694. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  695. name: default.bucketmapjoin_tmp_result
  696. tmp directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-48_438_2652635181723360989/-ext-10001
  697. Stage: Stage-2
  698. Stats-Aggr Operator
  699. Stats Aggregation Key Prefix: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-48_438_2652635181723360989/-ext-10000/
  700. Stage: Stage-3
  701. Map Reduce
  702. Alias -> Map Operator Tree:
  703. pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-48_438_2652635181723360989/-ext-10002
  704. File Output Operator
  705. compressed: false
  706. GlobalTableId: 0
  707. directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-48_438_2652635181723360989/-ext-10000
  708. NumFilesPerFileSink: 1
  709. table:
  710. input format: org.apache.hadoop.mapred.TextInputFormat
  711. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  712. properties:
  713. bucket_count -1
  714. columns key,value1,value2
  715. columns.types string:string:string
  716. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  717. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  718. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  719. name default.bucketmapjoin_tmp_result
  720. numFiles 1
  721. numPartitions 0
  722. numRows 464
  723. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  724. serialization.format 1
  725. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  726. totalSize 8983
  727. transient_lastDdlTime 1297330356
  728. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  729. name: default.bucketmapjoin_tmp_result
  730. TotalFiles: 1
  731. GatherStats: false
  732. MultiFileSpray: false
  733. Needs Tagging: false
  734. Path -> Alias:
  735. pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-48_438_2652635181723360989/-ext-10002 [pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-48_438_2652635181723360989/-ext-10002]
  736. Path -> Partition:
  737. pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_01-32-48_438_2652635181723360989/-ext-10002
  738. Partition
  739. base file name: -ext-10002
  740. input format: org.apache.hadoop.mapred.TextInputFormat
  741. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  742. properties:
  743. bucket_count -1
  744. columns key,value1,value2
  745. columns.types string:string:string
  746. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  747. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  748. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  749. name default.bucketmapjoin_tmp_result
  750. numFiles 1
  751. numPartitions 0
  752. numRows 464
  753. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  754. serialization.format 1
  755. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  756. t

Large files files are truncated, but you can click here to view the full file