PageRenderTime 60ms CodeModel.GetById 23ms RepoModel.GetById 0ms app.codeStats 0ms

/tags/release-0.2.0-rc0/hive/external/ql/src/test/results/clientpositive/bucketmapjoin4.q.out

#
text | 1013 lines | 989 code | 24 blank | 0 comment | 0 complexity | 570d96aceb6cb4a11e968199a42b5df6 MD5 | raw file
Possible License(s): Apache-2.0, BSD-3-Clause, JSON, CPL-1.0

Large files are truncated, but you can click here to view the full file

  1. PREHOOK: query: CREATE TABLE srcbucket_mapjoin(key int, value string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  2. PREHOOK: type: CREATETABLE
  3. POSTHOOK: query: CREATE TABLE srcbucket_mapjoin(key int, value string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  4. POSTHOOK: type: CREATETABLE
  5. POSTHOOK: Output: default@srcbucket_mapjoin
  6. PREHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin
  7. PREHOOK: type: LOAD
  8. PREHOOK: Output: default@srcbucket_mapjoin
  9. POSTHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin
  10. POSTHOOK: type: LOAD
  11. POSTHOOK: Output: default@srcbucket_mapjoin
  12. PREHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin
  13. PREHOOK: type: LOAD
  14. PREHOOK: Output: default@srcbucket_mapjoin
  15. POSTHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin
  16. POSTHOOK: type: LOAD
  17. POSTHOOK: Output: default@srcbucket_mapjoin
  18. PREHOOK: query: CREATE TABLE srcbucket_mapjoin_part (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 4 BUCKETS STORED AS TEXTFILE
  19. PREHOOK: type: CREATETABLE
  20. POSTHOOK: query: CREATE TABLE srcbucket_mapjoin_part (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 4 BUCKETS STORED AS TEXTFILE
  21. POSTHOOK: type: CREATETABLE
  22. POSTHOOK: Output: default@srcbucket_mapjoin_part
  23. PREHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  24. PREHOOK: type: LOAD
  25. PREHOOK: Output: default@srcbucket_mapjoin_part
  26. POSTHOOK: query: load data local inpath '../data/files/srcbucket20.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  27. POSTHOOK: type: LOAD
  28. POSTHOOK: Output: default@srcbucket_mapjoin_part
  29. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  30. PREHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  31. PREHOOK: type: LOAD
  32. PREHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  33. POSTHOOK: query: load data local inpath '../data/files/srcbucket21.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  34. POSTHOOK: type: LOAD
  35. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  36. PREHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  37. PREHOOK: type: LOAD
  38. PREHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  39. POSTHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  40. POSTHOOK: type: LOAD
  41. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  42. PREHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  43. PREHOOK: type: LOAD
  44. PREHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  45. POSTHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part partition(ds='2008-04-08')
  46. POSTHOOK: type: LOAD
  47. POSTHOOK: Output: default@srcbucket_mapjoin_part@ds=2008-04-08
  48. PREHOOK: query: CREATE TABLE srcbucket_mapjoin_part_2 (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  49. PREHOOK: type: CREATETABLE
  50. POSTHOOK: query: CREATE TABLE srcbucket_mapjoin_part_2 (key int, value string) partitioned by (ds string) CLUSTERED BY (key) INTO 2 BUCKETS STORED AS TEXTFILE
  51. POSTHOOK: type: CREATETABLE
  52. POSTHOOK: Output: default@srcbucket_mapjoin_part_2
  53. PREHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  54. PREHOOK: type: LOAD
  55. PREHOOK: Output: default@srcbucket_mapjoin_part_2
  56. POSTHOOK: query: load data local inpath '../data/files/srcbucket22.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  57. POSTHOOK: type: LOAD
  58. POSTHOOK: Output: default@srcbucket_mapjoin_part_2
  59. POSTHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  60. PREHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  61. PREHOOK: type: LOAD
  62. PREHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  63. POSTHOOK: query: load data local inpath '../data/files/srcbucket23.txt' INTO TABLE srcbucket_mapjoin_part_2 partition(ds='2008-04-08')
  64. POSTHOOK: type: LOAD
  65. POSTHOOK: Output: default@srcbucket_mapjoin_part_2@ds=2008-04-08
  66. PREHOOK: query: create table bucketmapjoin_hash_result_1 (key bigint , value1 bigint, value2 bigint)
  67. PREHOOK: type: CREATETABLE
  68. POSTHOOK: query: create table bucketmapjoin_hash_result_1 (key bigint , value1 bigint, value2 bigint)
  69. POSTHOOK: type: CREATETABLE
  70. POSTHOOK: Output: default@bucketmapjoin_hash_result_1
  71. PREHOOK: query: create table bucketmapjoin_hash_result_2 (key bigint , value1 bigint, value2 bigint)
  72. PREHOOK: type: CREATETABLE
  73. POSTHOOK: query: create table bucketmapjoin_hash_result_2 (key bigint , value1 bigint, value2 bigint)
  74. POSTHOOK: type: CREATETABLE
  75. POSTHOOK: Output: default@bucketmapjoin_hash_result_2
  76. PREHOOK: query: create table bucketmapjoin_tmp_result (key string , value1 string, value2 string)
  77. PREHOOK: type: CREATETABLE
  78. POSTHOOK: query: create table bucketmapjoin_tmp_result (key string , value1 string, value2 string)
  79. POSTHOOK: type: CREATETABLE
  80. POSTHOOK: Output: default@bucketmapjoin_tmp_result
  81. PREHOOK: query: explain extended
  82. insert overwrite table bucketmapjoin_tmp_result
  83. select /*+mapjoin(b)*/ a.key, a.value, b.value
  84. from srcbucket_mapjoin a join srcbucket_mapjoin b
  85. on a.key=b.key
  86. PREHOOK: type: QUERY
  87. POSTHOOK: query: explain extended
  88. insert overwrite table bucketmapjoin_tmp_result
  89. select /*+mapjoin(b)*/ a.key, a.value, b.value
  90. from srcbucket_mapjoin a join srcbucket_mapjoin b
  91. on a.key=b.key
  92. POSTHOOK: type: QUERY
  93. ABSTRACT SYNTAX TREE:
  94. (TOK_QUERY (TOK_FROM (TOK_JOIN (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin) a) (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin) b) (= (. (TOK_TABLE_OR_COL a) key) (. (TOK_TABLE_OR_COL b) key)))) (TOK_INSERT (TOK_DESTINATION (TOK_TAB (TOK_TABNAME bucketmapjoin_tmp_result))) (TOK_SELECT (TOK_HINTLIST (TOK_HINT TOK_MAPJOIN (TOK_HINTARGLIST b))) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) key)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) value)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL b) value)))))
  95. STAGE DEPENDENCIES:
  96. Stage-7 is a root stage
  97. Stage-1 depends on stages: Stage-7
  98. Stage-5 depends on stages: Stage-1 , consists of Stage-4, Stage-3
  99. Stage-4
  100. Stage-0 depends on stages: Stage-4, Stage-3
  101. Stage-2 depends on stages: Stage-0
  102. Stage-3
  103. STAGE PLANS:
  104. Stage: Stage-7
  105. Map Reduce Local Work
  106. Alias -> Map Local Tables:
  107. b
  108. Fetch Operator
  109. limit: -1
  110. Alias -> Map Local Operator Tree:
  111. b
  112. TableScan
  113. alias: b
  114. GatherStats: false
  115. HashTable Sink Operator
  116. condition expressions:
  117. 0 {key} {value}
  118. 1 {value}
  119. handleSkewJoin: false
  120. keys:
  121. 0 [Column[key]]
  122. 1 [Column[key]]
  123. Position of Big Table: 0
  124. Bucket Mapjoin Context:
  125. Alias Bucket Base File Name Mapping:
  126. b {srcbucket20.txt=[srcbucket20.txt], srcbucket21.txt=[srcbucket21.txt]}
  127. Alias Bucket File Name Mapping:
  128. b {pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt], pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt]}
  129. Alias Bucket Output File Name Mapping:
  130. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt 0
  131. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt 1
  132. Stage: Stage-1
  133. Map Reduce
  134. Alias -> Map Operator Tree:
  135. a
  136. TableScan
  137. alias: a
  138. GatherStats: false
  139. Map Join Operator
  140. condition map:
  141. Inner Join 0 to 1
  142. condition expressions:
  143. 0 {key} {value}
  144. 1 {value}
  145. handleSkewJoin: false
  146. keys:
  147. 0 [Column[key]]
  148. 1 [Column[key]]
  149. outputColumnNames: _col0, _col1, _col5
  150. Position of Big Table: 0
  151. Select Operator
  152. expressions:
  153. expr: _col0
  154. type: int
  155. expr: _col1
  156. type: string
  157. expr: _col5
  158. type: string
  159. outputColumnNames: _col0, _col1, _col5
  160. Select Operator
  161. expressions:
  162. expr: _col0
  163. type: int
  164. expr: _col1
  165. type: string
  166. expr: _col5
  167. type: string
  168. outputColumnNames: _col0, _col1, _col2
  169. File Output Operator
  170. compressed: false
  171. GlobalTableId: 1
  172. directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10002
  173. NumFilesPerFileSink: 1
  174. Stats Publishing Key Prefix: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10000/
  175. table:
  176. input format: org.apache.hadoop.mapred.TextInputFormat
  177. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  178. properties:
  179. bucket_count -1
  180. columns key,value1,value2
  181. columns.types string:string:string
  182. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  183. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  184. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  185. name default.bucketmapjoin_tmp_result
  186. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  187. serialization.format 1
  188. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  189. transient_lastDdlTime 1306979244
  190. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  191. name: default.bucketmapjoin_tmp_result
  192. TotalFiles: 1
  193. GatherStats: true
  194. MultiFileSpray: false
  195. Local Work:
  196. Map Reduce Local Work
  197. Needs Tagging: false
  198. Path -> Alias:
  199. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin [a]
  200. Path -> Partition:
  201. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin
  202. Partition
  203. base file name: srcbucket_mapjoin
  204. input format: org.apache.hadoop.mapred.TextInputFormat
  205. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  206. properties:
  207. bucket_count 2
  208. bucket_field_name key
  209. columns key,value
  210. columns.types int:string
  211. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  212. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  213. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin
  214. name default.srcbucket_mapjoin
  215. serialization.ddl struct srcbucket_mapjoin { i32 key, string value}
  216. serialization.format 1
  217. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  218. transient_lastDdlTime 1306979239
  219. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  220. input format: org.apache.hadoop.mapred.TextInputFormat
  221. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  222. properties:
  223. bucket_count 2
  224. bucket_field_name key
  225. columns key,value
  226. columns.types int:string
  227. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  228. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  229. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin
  230. name default.srcbucket_mapjoin
  231. serialization.ddl struct srcbucket_mapjoin { i32 key, string value}
  232. serialization.format 1
  233. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  234. transient_lastDdlTime 1306979239
  235. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  236. name: default.srcbucket_mapjoin
  237. name: default.srcbucket_mapjoin
  238. Stage: Stage-5
  239. Conditional Operator
  240. Stage: Stage-4
  241. Move Operator
  242. files:
  243. hdfs directory: true
  244. source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10002
  245. destination: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10000
  246. Stage: Stage-0
  247. Move Operator
  248. tables:
  249. replace: true
  250. source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10000
  251. table:
  252. input format: org.apache.hadoop.mapred.TextInputFormat
  253. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  254. properties:
  255. bucket_count -1
  256. columns key,value1,value2
  257. columns.types string:string:string
  258. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  259. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  260. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  261. name default.bucketmapjoin_tmp_result
  262. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  263. serialization.format 1
  264. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  265. transient_lastDdlTime 1306979244
  266. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  267. name: default.bucketmapjoin_tmp_result
  268. tmp directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10001
  269. Stage: Stage-2
  270. Stats-Aggr Operator
  271. Stats Aggregation Key Prefix: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10000/
  272. Stage: Stage-3
  273. Map Reduce
  274. Alias -> Map Operator Tree:
  275. pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10002
  276. File Output Operator
  277. compressed: false
  278. GlobalTableId: 0
  279. directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10000
  280. NumFilesPerFileSink: 1
  281. table:
  282. input format: org.apache.hadoop.mapred.TextInputFormat
  283. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  284. properties:
  285. bucket_count -1
  286. columns key,value1,value2
  287. columns.types string:string:string
  288. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  289. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  290. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  291. name default.bucketmapjoin_tmp_result
  292. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  293. serialization.format 1
  294. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  295. transient_lastDdlTime 1306979244
  296. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  297. name: default.bucketmapjoin_tmp_result
  298. TotalFiles: 1
  299. GatherStats: false
  300. MultiFileSpray: false
  301. Needs Tagging: false
  302. Path -> Alias:
  303. pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10002 [pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10002]
  304. Path -> Partition:
  305. pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-24_202_6585306882290425835/-ext-10002
  306. Partition
  307. base file name: -ext-10002
  308. input format: org.apache.hadoop.mapred.TextInputFormat
  309. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  310. properties:
  311. bucket_count -1
  312. columns key,value1,value2
  313. columns.types string:string:string
  314. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  315. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  316. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  317. name default.bucketmapjoin_tmp_result
  318. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  319. serialization.format 1
  320. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  321. transient_lastDdlTime 1306979244
  322. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  323. input format: org.apache.hadoop.mapred.TextInputFormat
  324. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  325. properties:
  326. bucket_count -1
  327. columns key,value1,value2
  328. columns.types string:string:string
  329. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  330. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  331. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  332. name default.bucketmapjoin_tmp_result
  333. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  334. serialization.format 1
  335. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  336. transient_lastDdlTime 1306979244
  337. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  338. name: default.bucketmapjoin_tmp_result
  339. name: default.bucketmapjoin_tmp_result
  340. PREHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  341. select /*+mapjoin(b)*/ a.key, a.value, b.value
  342. from srcbucket_mapjoin a join srcbucket_mapjoin b
  343. on a.key=b.key
  344. PREHOOK: type: QUERY
  345. PREHOOK: Input: default@srcbucket_mapjoin
  346. PREHOOK: Output: default@bucketmapjoin_tmp_result
  347. POSTHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  348. select /*+mapjoin(b)*/ a.key, a.value, b.value
  349. from srcbucket_mapjoin a join srcbucket_mapjoin b
  350. on a.key=b.key
  351. POSTHOOK: type: QUERY
  352. POSTHOOK: Input: default@srcbucket_mapjoin
  353. POSTHOOK: Output: default@bucketmapjoin_tmp_result
  354. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  355. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  356. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
  357. PREHOOK: query: select count(1) from bucketmapjoin_tmp_result
  358. PREHOOK: type: QUERY
  359. PREHOOK: Input: default@bucketmapjoin_tmp_result
  360. PREHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-47-33_354_3111033757385788525/-mr-10000
  361. POSTHOOK: query: select count(1) from bucketmapjoin_tmp_result
  362. POSTHOOK: type: QUERY
  363. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  364. POSTHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-47-33_354_3111033757385788525/-mr-10000
  365. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  366. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  367. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
  368. 464
  369. PREHOOK: query: insert overwrite table bucketmapjoin_hash_result_1
  370. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  371. PREHOOK: type: QUERY
  372. PREHOOK: Input: default@bucketmapjoin_tmp_result
  373. PREHOOK: Output: default@bucketmapjoin_hash_result_1
  374. POSTHOOK: query: insert overwrite table bucketmapjoin_hash_result_1
  375. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  376. POSTHOOK: type: QUERY
  377. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  378. POSTHOOK: Output: default@bucketmapjoin_hash_result_1
  379. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  380. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  381. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  382. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  383. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  384. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
  385. PREHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  386. select /*+mapjoin(b)*/ a.key, a.value, b.value
  387. from srcbucket_mapjoin a join srcbucket_mapjoin b
  388. on a.key=b.key
  389. PREHOOK: type: QUERY
  390. PREHOOK: Input: default@srcbucket_mapjoin
  391. PREHOOK: Output: default@bucketmapjoin_tmp_result
  392. POSTHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  393. select /*+mapjoin(b)*/ a.key, a.value, b.value
  394. from srcbucket_mapjoin a join srcbucket_mapjoin b
  395. on a.key=b.key
  396. POSTHOOK: type: QUERY
  397. POSTHOOK: Input: default@srcbucket_mapjoin
  398. POSTHOOK: Output: default@bucketmapjoin_tmp_result
  399. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  400. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  401. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  402. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  403. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  404. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  405. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  406. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
  407. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
  408. PREHOOK: query: select count(1) from bucketmapjoin_tmp_result
  409. PREHOOK: type: QUERY
  410. PREHOOK: Input: default@bucketmapjoin_tmp_result
  411. PREHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-47-49_331_2976822432880371649/-mr-10000
  412. POSTHOOK: query: select count(1) from bucketmapjoin_tmp_result
  413. POSTHOOK: type: QUERY
  414. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  415. POSTHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-47-49_331_2976822432880371649/-mr-10000
  416. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  417. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  418. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  419. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  420. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  421. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  422. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  423. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
  424. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
  425. 464
  426. PREHOOK: query: insert overwrite table bucketmapjoin_hash_result_2
  427. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  428. PREHOOK: type: QUERY
  429. PREHOOK: Input: default@bucketmapjoin_tmp_result
  430. PREHOOK: Output: default@bucketmapjoin_hash_result_2
  431. POSTHOOK: query: insert overwrite table bucketmapjoin_hash_result_2
  432. select sum(hash(key)), sum(hash(value1)), sum(hash(value2)) from bucketmapjoin_tmp_result
  433. POSTHOOK: type: QUERY
  434. POSTHOOK: Input: default@bucketmapjoin_tmp_result
  435. POSTHOOK: Output: default@bucketmapjoin_hash_result_2
  436. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  437. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  438. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  439. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  440. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  441. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  442. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  443. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  444. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  445. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  446. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
  447. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
  448. PREHOOK: query: select a.key-b.key, a.value1-b.value1, a.value2-b.value2
  449. from bucketmapjoin_hash_result_1 a left outer join bucketmapjoin_hash_result_2 b
  450. on a.key = b.key
  451. PREHOOK: type: QUERY
  452. PREHOOK: Input: default@bucketmapjoin_hash_result_1
  453. PREHOOK: Input: default@bucketmapjoin_hash_result_2
  454. PREHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-47-56_317_7787039686001016086/-mr-10000
  455. POSTHOOK: query: select a.key-b.key, a.value1-b.value1, a.value2-b.value2
  456. from bucketmapjoin_hash_result_1 a left outer join bucketmapjoin_hash_result_2 b
  457. on a.key = b.key
  458. POSTHOOK: type: QUERY
  459. POSTHOOK: Input: default@bucketmapjoin_hash_result_1
  460. POSTHOOK: Input: default@bucketmapjoin_hash_result_2
  461. POSTHOOK: Output: file:/tmp/tomasz/hive_2011-06-01_18-47-56_317_7787039686001016086/-mr-10000
  462. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  463. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  464. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  465. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  466. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  467. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  468. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  469. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  470. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  471. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  472. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
  473. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
  474. 0 0 0
  475. PREHOOK: query: explain extended
  476. insert overwrite table bucketmapjoin_tmp_result
  477. select /*+mapjoin(a)*/ a.key, a.value, b.value
  478. from srcbucket_mapjoin a join srcbucket_mapjoin b
  479. on a.key=b.key
  480. PREHOOK: type: QUERY
  481. POSTHOOK: query: explain extended
  482. insert overwrite table bucketmapjoin_tmp_result
  483. select /*+mapjoin(a)*/ a.key, a.value, b.value
  484. from srcbucket_mapjoin a join srcbucket_mapjoin b
  485. on a.key=b.key
  486. POSTHOOK: type: QUERY
  487. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  488. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  489. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  490. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  491. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  492. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  493. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  494. POSTHOOK: Lineage: bucketmapjoin_tmp_result.key SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:key, type:int, comment:null), ]
  495. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  496. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value1 SIMPLE [(srcbucket_mapjoin)a.FieldSchema(name:value, type:string, comment:null), ]
  497. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
  498. POSTHOOK: Lineage: bucketmapjoin_tmp_result.value2 SIMPLE [(srcbucket_mapjoin)b.FieldSchema(name:value, type:string, comment:null), ]
  499. ABSTRACT SYNTAX TREE:
  500. (TOK_QUERY (TOK_FROM (TOK_JOIN (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin) a) (TOK_TABREF (TOK_TABNAME srcbucket_mapjoin) b) (= (. (TOK_TABLE_OR_COL a) key) (. (TOK_TABLE_OR_COL b) key)))) (TOK_INSERT (TOK_DESTINATION (TOK_TAB (TOK_TABNAME bucketmapjoin_tmp_result))) (TOK_SELECT (TOK_HINTLIST (TOK_HINT TOK_MAPJOIN (TOK_HINTARGLIST a))) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) key)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL a) value)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL b) value)))))
  501. STAGE DEPENDENCIES:
  502. Stage-7 is a root stage
  503. Stage-1 depends on stages: Stage-7
  504. Stage-5 depends on stages: Stage-1 , consists of Stage-4, Stage-3
  505. Stage-4
  506. Stage-0 depends on stages: Stage-4, Stage-3
  507. Stage-2 depends on stages: Stage-0
  508. Stage-3
  509. STAGE PLANS:
  510. Stage: Stage-7
  511. Map Reduce Local Work
  512. Alias -> Map Local Tables:
  513. a
  514. Fetch Operator
  515. limit: -1
  516. Alias -> Map Local Operator Tree:
  517. a
  518. TableScan
  519. alias: a
  520. GatherStats: false
  521. HashTable Sink Operator
  522. condition expressions:
  523. 0 {key} {value}
  524. 1 {value}
  525. handleSkewJoin: false
  526. keys:
  527. 0 [Column[key]]
  528. 1 [Column[key]]
  529. Position of Big Table: 1
  530. Bucket Mapjoin Context:
  531. Alias Bucket Base File Name Mapping:
  532. a {srcbucket20.txt=[srcbucket20.txt], srcbucket21.txt=[srcbucket21.txt]}
  533. Alias Bucket File Name Mapping:
  534. a {pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt], pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt=[pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt]}
  535. Alias Bucket Output File Name Mapping:
  536. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket20.txt 0
  537. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin/srcbucket21.txt 1
  538. Stage: Stage-1
  539. Map Reduce
  540. Alias -> Map Operator Tree:
  541. b
  542. TableScan
  543. alias: b
  544. GatherStats: false
  545. Map Join Operator
  546. condition map:
  547. Inner Join 0 to 1
  548. condition expressions:
  549. 0 {key} {value}
  550. 1 {value}
  551. handleSkewJoin: false
  552. keys:
  553. 0 [Column[key]]
  554. 1 [Column[key]]
  555. outputColumnNames: _col0, _col1, _col5
  556. Position of Big Table: 1
  557. Select Operator
  558. expressions:
  559. expr: _col0
  560. type: int
  561. expr: _col1
  562. type: string
  563. expr: _col5
  564. type: string
  565. outputColumnNames: _col0, _col1, _col5
  566. Select Operator
  567. expressions:
  568. expr: _col0
  569. type: int
  570. expr: _col1
  571. type: string
  572. expr: _col5
  573. type: string
  574. outputColumnNames: _col0, _col1, _col2
  575. File Output Operator
  576. compressed: false
  577. GlobalTableId: 1
  578. directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10002
  579. NumFilesPerFileSink: 1
  580. Stats Publishing Key Prefix: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10000/
  581. table:
  582. input format: org.apache.hadoop.mapred.TextInputFormat
  583. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  584. properties:
  585. bucket_count -1
  586. columns key,value1,value2
  587. columns.types string:string:string
  588. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  589. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  590. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  591. name default.bucketmapjoin_tmp_result
  592. numFiles 1
  593. numPartitions 0
  594. numRows 464
  595. rawDataSize 8519
  596. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  597. serialization.format 1
  598. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  599. totalSize 8983
  600. transient_lastDdlTime 1306979269
  601. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  602. name: default.bucketmapjoin_tmp_result
  603. TotalFiles: 1
  604. GatherStats: true
  605. MultiFileSpray: false
  606. Local Work:
  607. Map Reduce Local Work
  608. Needs Tagging: false
  609. Path -> Alias:
  610. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin [b]
  611. Path -> Partition:
  612. pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin
  613. Partition
  614. base file name: srcbucket_mapjoin
  615. input format: org.apache.hadoop.mapred.TextInputFormat
  616. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  617. properties:
  618. bucket_count 2
  619. bucket_field_name key
  620. columns key,value
  621. columns.types int:string
  622. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  623. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  624. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin
  625. name default.srcbucket_mapjoin
  626. serialization.ddl struct srcbucket_mapjoin { i32 key, string value}
  627. serialization.format 1
  628. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  629. transient_lastDdlTime 1306979239
  630. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  631. input format: org.apache.hadoop.mapred.TextInputFormat
  632. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  633. properties:
  634. bucket_count 2
  635. bucket_field_name key
  636. columns key,value
  637. columns.types int:string
  638. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  639. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  640. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/srcbucket_mapjoin
  641. name default.srcbucket_mapjoin
  642. serialization.ddl struct srcbucket_mapjoin { i32 key, string value}
  643. serialization.format 1
  644. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  645. transient_lastDdlTime 1306979239
  646. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  647. name: default.srcbucket_mapjoin
  648. name: default.srcbucket_mapjoin
  649. Stage: Stage-5
  650. Conditional Operator
  651. Stage: Stage-4
  652. Move Operator
  653. files:
  654. hdfs directory: true
  655. source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10002
  656. destination: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10000
  657. Stage: Stage-0
  658. Move Operator
  659. tables:
  660. replace: true
  661. source: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10000
  662. table:
  663. input format: org.apache.hadoop.mapred.TextInputFormat
  664. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  665. properties:
  666. bucket_count -1
  667. columns key,value1,value2
  668. columns.types string:string:string
  669. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  670. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  671. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  672. name default.bucketmapjoin_tmp_result
  673. numFiles 1
  674. numPartitions 0
  675. numRows 464
  676. rawDataSize 8519
  677. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  678. serialization.format 1
  679. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  680. totalSize 8983
  681. transient_lastDdlTime 1306979269
  682. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  683. name: default.bucketmapjoin_tmp_result
  684. tmp directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10001
  685. Stage: Stage-2
  686. Stats-Aggr Operator
  687. Stats Aggregation Key Prefix: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10000/
  688. Stage: Stage-3
  689. Map Reduce
  690. Alias -> Map Operator Tree:
  691. pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10002
  692. File Output Operator
  693. compressed: false
  694. GlobalTableId: 0
  695. directory: pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10000
  696. NumFilesPerFileSink: 1
  697. table:
  698. input format: org.apache.hadoop.mapred.TextInputFormat
  699. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  700. properties:
  701. bucket_count -1
  702. columns key,value1,value2
  703. columns.types string:string:string
  704. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  705. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  706. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  707. name default.bucketmapjoin_tmp_result
  708. numFiles 1
  709. numPartitions 0
  710. numRows 464
  711. rawDataSize 8519
  712. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  713. serialization.format 1
  714. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  715. totalSize 8983
  716. transient_lastDdlTime 1306979269
  717. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  718. name: default.bucketmapjoin_tmp_result
  719. TotalFiles: 1
  720. GatherStats: false
  721. MultiFileSpray: false
  722. Needs Tagging: false
  723. Path -> Alias:
  724. pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10002 [pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10002]
  725. Path -> Partition:
  726. pfile:/data/users/tomasz/apache-hive/build/ql/scratchdir/hive_2011-06-01_18-47-59_537_2542627376244877759/-ext-10002
  727. Partition
  728. base file name: -ext-10002
  729. input format: org.apache.hadoop.mapred.TextInputFormat
  730. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  731. properties:
  732. bucket_count -1
  733. columns key,value1,value2
  734. columns.types string:string:string
  735. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  736. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  737. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  738. name default.bucketmapjoin_tmp_result
  739. numFiles 1
  740. numPartitions 0
  741. numRows 464
  742. rawDataSize 8519
  743. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  744. serialization.format 1
  745. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  746. totalSize 8983
  747. transient_lastDdlTime 1306979269
  748. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  749. input format: org.apache.hadoop.mapred.TextInputFormat
  750. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  751. properties:
  752. bucket_count -1
  753. columns key,value1,value2
  754. columns.types string:string:string
  755. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  756. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  757. location pfile:/data/users/tomasz/apache-hive/build/ql/test/data/warehouse/bucketmapjoin_tmp_result
  758. name default.bucketmapjoin_tmp_result
  759. numFiles 1
  760. numPartitions 0
  761. numRows 464
  762. rawDataSize 8519
  763. serialization.ddl struct bucketmapjoin_tmp_result { string key, string value1, string value2}
  764. serialization.format 1
  765. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  766. totalSize 8983
  767. transient_lastDdlTime 1306979269
  768. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  769. name: default.bucketmapjoin_tmp_result
  770. name: default.bucketmapjoin_tmp_result
  771. PREHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  772. select /*+mapjoin(a)*/ a.key, a.value, b.value
  773. from srcbucket_mapjoin a join srcbucket_mapjoin b
  774. on a.key=b.key
  775. PREHOOK: type: QUERY
  776. PREHOOK: Input: default@srcbucket_mapjoin
  777. PREHOOK: Output: default@bucketmapjoin_tmp_result
  778. POSTHOOK: query: insert overwrite table bucketmapjoin_tmp_result
  779. select /*+mapjoin(a)*/ a.key, a.value, b.value
  780. from srcbucket_mapjoin a join srcbucket_mapjoin b
  781. on a.key=b.key
  782. POSTHOOK: type: QUERY
  783. POSTHOOK: Input: default@srcbucket_mapjoin
  784. POSTHOOK: Output: default@bucketmapjoin_tmp_result
  785. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null), ]
  786. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value1 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value1, type:string, comment:null), ]
  787. POSTHOOK: Lineage: bucketmapjoin_hash_result_1.value2 EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:value2, type:string, comment:null), ]
  788. POSTHOOK: Lineage: bucketmapjoin_hash_result_2.key EXPRESSION [(bucketmapjoin_tmp_result)bucketmapjoin_tmp_result.FieldSchema(name:key, type:string, comment:null

Large files files are truncated, but you can click here to view the full file