/tags/release-0.2.0-rc0/hive/external/ql/src/test/results/clientpositive/join35.q.out

# · text · 620 lines · 603 code · 17 blank · 0 comment · 0 complexity · 06655e99609b5e9631534c60bfae7927 MD5 · raw file

  1. PREHOOK: query: CREATE TABLE dest_j1(key STRING, value STRING, val2 INT) STORED AS TEXTFILE
  2. PREHOOK: type: CREATETABLE
  3. POSTHOOK: query: CREATE TABLE dest_j1(key STRING, value STRING, val2 INT) STORED AS TEXTFILE
  4. POSTHOOK: type: CREATETABLE
  5. POSTHOOK: Output: default@dest_j1
  6. PREHOOK: query: EXPLAIN EXTENDED
  7. INSERT OVERWRITE TABLE dest_j1
  8. SELECT /*+ MAPJOIN(x) */ x.key, x.value, subq1.cnt
  9. FROM
  10. ( SELECT x.key as key, count(1) as cnt from src x where x.key < 20 group by x.key
  11. UNION ALL
  12. SELECT x1.key as key, count(1) as cnt from src x1 where x1.key > 100 group by x1.key
  13. ) subq1
  14. JOIN src1 x ON (x.key = subq1.key)
  15. PREHOOK: type: QUERY
  16. POSTHOOK: query: EXPLAIN EXTENDED
  17. INSERT OVERWRITE TABLE dest_j1
  18. SELECT /*+ MAPJOIN(x) */ x.key, x.value, subq1.cnt
  19. FROM
  20. ( SELECT x.key as key, count(1) as cnt from src x where x.key < 20 group by x.key
  21. UNION ALL
  22. SELECT x1.key as key, count(1) as cnt from src x1 where x1.key > 100 group by x1.key
  23. ) subq1
  24. JOIN src1 x ON (x.key = subq1.key)
  25. POSTHOOK: type: QUERY
  26. ABSTRACT SYNTAX TREE:
  27. (TOK_QUERY (TOK_FROM (TOK_JOIN (TOK_SUBQUERY (TOK_UNION (TOK_QUERY (TOK_FROM (TOK_TABREF (TOK_TABNAME src) x)) (TOK_INSERT (TOK_DESTINATION (TOK_DIR TOK_TMP_FILE)) (TOK_SELECT (TOK_SELEXPR (. (TOK_TABLE_OR_COL x) key) key) (TOK_SELEXPR (TOK_FUNCTION count 1) cnt)) (TOK_WHERE (< (. (TOK_TABLE_OR_COL x) key) 20)) (TOK_GROUPBY (. (TOK_TABLE_OR_COL x) key)))) (TOK_QUERY (TOK_FROM (TOK_TABREF (TOK_TABNAME src) x1)) (TOK_INSERT (TOK_DESTINATION (TOK_DIR TOK_TMP_FILE)) (TOK_SELECT (TOK_SELEXPR (. (TOK_TABLE_OR_COL x1) key) key) (TOK_SELEXPR (TOK_FUNCTION count 1) cnt)) (TOK_WHERE (> (. (TOK_TABLE_OR_COL x1) key) 100)) (TOK_GROUPBY (. (TOK_TABLE_OR_COL x1) key))))) subq1) (TOK_TABREF (TOK_TABNAME src1) x) (= (. (TOK_TABLE_OR_COL x) key) (. (TOK_TABLE_OR_COL subq1) key)))) (TOK_INSERT (TOK_DESTINATION (TOK_TAB (TOK_TABNAME dest_j1))) (TOK_SELECT (TOK_HINTLIST (TOK_HINT TOK_MAPJOIN (TOK_HINTARGLIST x))) (TOK_SELEXPR (. (TOK_TABLE_OR_COL x) key)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL x) value)) (TOK_SELEXPR (. (TOK_TABLE_OR_COL subq1) cnt)))))
  28. STAGE DEPENDENCIES:
  29. Stage-1 is a root stage
  30. Stage-9 depends on stages: Stage-1, Stage-7
  31. Stage-2 depends on stages: Stage-9
  32. Stage-6 depends on stages: Stage-2 , consists of Stage-5, Stage-4
  33. Stage-5
  34. Stage-0 depends on stages: Stage-5, Stage-4
  35. Stage-3 depends on stages: Stage-0
  36. Stage-4
  37. Stage-7 is a root stage
  38. STAGE PLANS:
  39. Stage: Stage-1
  40. Map Reduce
  41. Alias -> Map Operator Tree:
  42. null-subquery1:subq1-subquery1:x
  43. TableScan
  44. alias: x
  45. GatherStats: false
  46. Filter Operator
  47. isSamplingPred: false
  48. predicate:
  49. expr: (key < 20)
  50. type: boolean
  51. Select Operator
  52. expressions:
  53. expr: key
  54. type: string
  55. outputColumnNames: key
  56. Group By Operator
  57. aggregations:
  58. expr: count(1)
  59. bucketGroup: false
  60. keys:
  61. expr: key
  62. type: string
  63. mode: hash
  64. outputColumnNames: _col0, _col1
  65. Reduce Output Operator
  66. key expressions:
  67. expr: _col0
  68. type: string
  69. sort order: +
  70. Map-reduce partition columns:
  71. expr: _col0
  72. type: string
  73. tag: -1
  74. value expressions:
  75. expr: _col1
  76. type: bigint
  77. Needs Tagging: false
  78. Path -> Alias:
  79. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/src [null-subquery1:subq1-subquery1:x]
  80. Path -> Partition:
  81. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/src
  82. Partition
  83. base file name: src
  84. input format: org.apache.hadoop.mapred.TextInputFormat
  85. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  86. properties:
  87. bucket_count -1
  88. columns key,value
  89. columns.types string:string
  90. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  91. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  92. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/src
  93. name default.src
  94. serialization.ddl struct src { string key, string value}
  95. serialization.format 1
  96. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  97. transient_lastDdlTime 1297378968
  98. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  99. input format: org.apache.hadoop.mapred.TextInputFormat
  100. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  101. properties:
  102. bucket_count -1
  103. columns key,value
  104. columns.types string:string
  105. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  106. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  107. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/src
  108. name default.src
  109. serialization.ddl struct src { string key, string value}
  110. serialization.format 1
  111. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  112. transient_lastDdlTime 1297378968
  113. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  114. name: default.src
  115. name: default.src
  116. Reduce Operator Tree:
  117. Group By Operator
  118. aggregations:
  119. expr: count(VALUE._col0)
  120. bucketGroup: false
  121. keys:
  122. expr: KEY._col0
  123. type: string
  124. mode: mergepartial
  125. outputColumnNames: _col0, _col1
  126. Select Operator
  127. expressions:
  128. expr: _col0
  129. type: string
  130. expr: _col1
  131. type: bigint
  132. outputColumnNames: _col0, _col1
  133. File Output Operator
  134. compressed: false
  135. GlobalTableId: 0
  136. directory: file:/tmp/sdong/hive_2011-02-10_16-06-08_256_5728117320203012463/-mr-10002
  137. NumFilesPerFileSink: 1
  138. table:
  139. input format: org.apache.hadoop.mapred.SequenceFileInputFormat
  140. output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
  141. properties:
  142. columns _col0,_col1
  143. columns.types string,bigint
  144. escape.delim \
  145. TotalFiles: 1
  146. GatherStats: false
  147. MultiFileSpray: false
  148. Stage: Stage-9
  149. Map Reduce Local Work
  150. Alias -> Map Local Tables:
  151. x
  152. Fetch Operator
  153. limit: -1
  154. Alias -> Map Local Operator Tree:
  155. x
  156. TableScan
  157. alias: x
  158. GatherStats: false
  159. HashTable Sink Operator
  160. condition expressions:
  161. 0 {_col1}
  162. 1 {key} {value}
  163. handleSkewJoin: false
  164. keys:
  165. 0 [Column[_col0]]
  166. 1 [Column[key]]
  167. Position of Big Table: 0
  168. Stage: Stage-2
  169. Map Reduce
  170. Alias -> Map Operator Tree:
  171. file:/tmp/sdong/hive_2011-02-10_16-06-08_256_5728117320203012463/-mr-10002
  172. Union
  173. Map Join Operator
  174. condition map:
  175. Inner Join 0 to 1
  176. condition expressions:
  177. 0 {_col1}
  178. 1 {key} {value}
  179. handleSkewJoin: false
  180. keys:
  181. 0 [Column[_col0]]
  182. 1 [Column[key]]
  183. outputColumnNames: _col1, _col2, _col3
  184. Position of Big Table: 0
  185. Select Operator
  186. expressions:
  187. expr: _col1
  188. type: bigint
  189. expr: _col2
  190. type: string
  191. expr: _col3
  192. type: string
  193. outputColumnNames: _col1, _col2, _col3
  194. Select Operator
  195. expressions:
  196. expr: _col2
  197. type: string
  198. expr: _col3
  199. type: string
  200. expr: _col1
  201. type: bigint
  202. outputColumnNames: _col0, _col1, _col2
  203. Select Operator
  204. expressions:
  205. expr: _col0
  206. type: string
  207. expr: _col1
  208. type: string
  209. expr: UDFToInteger(_col2)
  210. type: int
  211. outputColumnNames: _col0, _col1, _col2
  212. File Output Operator
  213. compressed: false
  214. GlobalTableId: 1
  215. directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_16-06-08_256_5728117320203012463/-ext-10003
  216. NumFilesPerFileSink: 1
  217. Stats Publishing Key Prefix: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_16-06-08_256_5728117320203012463/-ext-10000/
  218. table:
  219. input format: org.apache.hadoop.mapred.TextInputFormat
  220. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  221. properties:
  222. bucket_count -1
  223. columns key,value,val2
  224. columns.types string:string:int
  225. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  226. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  227. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/dest_j1
  228. name default.dest_j1
  229. serialization.ddl struct dest_j1 { string key, string value, i32 val2}
  230. serialization.format 1
  231. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  232. transient_lastDdlTime 1297382768
  233. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  234. name: default.dest_j1
  235. TotalFiles: 1
  236. GatherStats: true
  237. MultiFileSpray: false
  238. file:/tmp/sdong/hive_2011-02-10_16-06-08_256_5728117320203012463/-mr-10004
  239. Union
  240. Map Join Operator
  241. condition map:
  242. Inner Join 0 to 1
  243. condition expressions:
  244. 0 {_col1}
  245. 1 {key} {value}
  246. handleSkewJoin: false
  247. keys:
  248. 0 [Column[_col0]]
  249. 1 [Column[key]]
  250. outputColumnNames: _col1, _col2, _col3
  251. Position of Big Table: 0
  252. Select Operator
  253. expressions:
  254. expr: _col1
  255. type: bigint
  256. expr: _col2
  257. type: string
  258. expr: _col3
  259. type: string
  260. outputColumnNames: _col1, _col2, _col3
  261. Select Operator
  262. expressions:
  263. expr: _col2
  264. type: string
  265. expr: _col3
  266. type: string
  267. expr: _col1
  268. type: bigint
  269. outputColumnNames: _col0, _col1, _col2
  270. Select Operator
  271. expressions:
  272. expr: _col0
  273. type: string
  274. expr: _col1
  275. type: string
  276. expr: UDFToInteger(_col2)
  277. type: int
  278. outputColumnNames: _col0, _col1, _col2
  279. File Output Operator
  280. compressed: false
  281. GlobalTableId: 1
  282. directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_16-06-08_256_5728117320203012463/-ext-10003
  283. NumFilesPerFileSink: 1
  284. Stats Publishing Key Prefix: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_16-06-08_256_5728117320203012463/-ext-10000/
  285. table:
  286. input format: org.apache.hadoop.mapred.TextInputFormat
  287. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  288. properties:
  289. bucket_count -1
  290. columns key,value,val2
  291. columns.types string:string:int
  292. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  293. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  294. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/dest_j1
  295. name default.dest_j1
  296. serialization.ddl struct dest_j1 { string key, string value, i32 val2}
  297. serialization.format 1
  298. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  299. transient_lastDdlTime 1297382768
  300. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  301. name: default.dest_j1
  302. TotalFiles: 1
  303. GatherStats: true
  304. MultiFileSpray: false
  305. Local Work:
  306. Map Reduce Local Work
  307. Needs Tagging: false
  308. Path -> Alias:
  309. file:/tmp/sdong/hive_2011-02-10_16-06-08_256_5728117320203012463/-mr-10002 [file:/tmp/sdong/hive_2011-02-10_16-06-08_256_5728117320203012463/-mr-10002]
  310. file:/tmp/sdong/hive_2011-02-10_16-06-08_256_5728117320203012463/-mr-10004 [file:/tmp/sdong/hive_2011-02-10_16-06-08_256_5728117320203012463/-mr-10004]
  311. Path -> Partition:
  312. file:/tmp/sdong/hive_2011-02-10_16-06-08_256_5728117320203012463/-mr-10002
  313. Partition
  314. base file name: -mr-10002
  315. input format: org.apache.hadoop.mapred.SequenceFileInputFormat
  316. output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
  317. properties:
  318. columns _col0,_col1
  319. columns.types string,bigint
  320. escape.delim \
  321. input format: org.apache.hadoop.mapred.SequenceFileInputFormat
  322. output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
  323. properties:
  324. columns _col0,_col1
  325. columns.types string,bigint
  326. escape.delim \
  327. file:/tmp/sdong/hive_2011-02-10_16-06-08_256_5728117320203012463/-mr-10004
  328. Partition
  329. base file name: -mr-10004
  330. input format: org.apache.hadoop.mapred.SequenceFileInputFormat
  331. output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
  332. properties:
  333. columns _col0,_col1
  334. columns.types string,bigint
  335. escape.delim \
  336. input format: org.apache.hadoop.mapred.SequenceFileInputFormat
  337. output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
  338. properties:
  339. columns _col0,_col1
  340. columns.types string,bigint
  341. escape.delim \
  342. Stage: Stage-6
  343. Conditional Operator
  344. Stage: Stage-5
  345. Move Operator
  346. files:
  347. hdfs directory: true
  348. source: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_16-06-08_256_5728117320203012463/-ext-10003
  349. destination: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_16-06-08_256_5728117320203012463/-ext-10000
  350. Stage: Stage-0
  351. Move Operator
  352. tables:
  353. replace: true
  354. source: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_16-06-08_256_5728117320203012463/-ext-10000
  355. table:
  356. input format: org.apache.hadoop.mapred.TextInputFormat
  357. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  358. properties:
  359. bucket_count -1
  360. columns key,value,val2
  361. columns.types string:string:int
  362. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  363. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  364. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/dest_j1
  365. name default.dest_j1
  366. serialization.ddl struct dest_j1 { string key, string value, i32 val2}
  367. serialization.format 1
  368. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  369. transient_lastDdlTime 1297382768
  370. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  371. name: default.dest_j1
  372. tmp directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_16-06-08_256_5728117320203012463/-ext-10001
  373. Stage: Stage-3
  374. Stats-Aggr Operator
  375. Stats Aggregation Key Prefix: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_16-06-08_256_5728117320203012463/-ext-10000/
  376. Stage: Stage-4
  377. Map Reduce
  378. Alias -> Map Operator Tree:
  379. pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_16-06-08_256_5728117320203012463/-ext-10003
  380. File Output Operator
  381. compressed: false
  382. GlobalTableId: 0
  383. directory: pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_16-06-08_256_5728117320203012463/-ext-10000
  384. NumFilesPerFileSink: 1
  385. table:
  386. input format: org.apache.hadoop.mapred.TextInputFormat
  387. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  388. properties:
  389. bucket_count -1
  390. columns key,value,val2
  391. columns.types string:string:int
  392. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  393. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  394. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/dest_j1
  395. name default.dest_j1
  396. serialization.ddl struct dest_j1 { string key, string value, i32 val2}
  397. serialization.format 1
  398. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  399. transient_lastDdlTime 1297382768
  400. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  401. name: default.dest_j1
  402. TotalFiles: 1
  403. GatherStats: false
  404. MultiFileSpray: false
  405. Needs Tagging: false
  406. Path -> Alias:
  407. pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_16-06-08_256_5728117320203012463/-ext-10003 [pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_16-06-08_256_5728117320203012463/-ext-10003]
  408. Path -> Partition:
  409. pfile:/data/users/sdong/www/open-source-hive1/build/ql/scratchdir/hive_2011-02-10_16-06-08_256_5728117320203012463/-ext-10003
  410. Partition
  411. base file name: -ext-10003
  412. input format: org.apache.hadoop.mapred.TextInputFormat
  413. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  414. properties:
  415. bucket_count -1
  416. columns key,value,val2
  417. columns.types string:string:int
  418. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  419. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  420. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/dest_j1
  421. name default.dest_j1
  422. serialization.ddl struct dest_j1 { string key, string value, i32 val2}
  423. serialization.format 1
  424. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  425. transient_lastDdlTime 1297382768
  426. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  427. input format: org.apache.hadoop.mapred.TextInputFormat
  428. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  429. properties:
  430. bucket_count -1
  431. columns key,value,val2
  432. columns.types string:string:int
  433. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  434. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  435. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/dest_j1
  436. name default.dest_j1
  437. serialization.ddl struct dest_j1 { string key, string value, i32 val2}
  438. serialization.format 1
  439. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  440. transient_lastDdlTime 1297382768
  441. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  442. name: default.dest_j1
  443. name: default.dest_j1
  444. Stage: Stage-7
  445. Map Reduce
  446. Alias -> Map Operator Tree:
  447. null-subquery2:subq1-subquery2:x1
  448. TableScan
  449. alias: x1
  450. GatherStats: false
  451. Filter Operator
  452. isSamplingPred: false
  453. predicate:
  454. expr: (key > 100)
  455. type: boolean
  456. Select Operator
  457. expressions:
  458. expr: key
  459. type: string
  460. outputColumnNames: key
  461. Group By Operator
  462. aggregations:
  463. expr: count(1)
  464. bucketGroup: false
  465. keys:
  466. expr: key
  467. type: string
  468. mode: hash
  469. outputColumnNames: _col0, _col1
  470. Reduce Output Operator
  471. key expressions:
  472. expr: _col0
  473. type: string
  474. sort order: +
  475. Map-reduce partition columns:
  476. expr: _col0
  477. type: string
  478. tag: -1
  479. value expressions:
  480. expr: _col1
  481. type: bigint
  482. Needs Tagging: false
  483. Path -> Alias:
  484. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/src [null-subquery2:subq1-subquery2:x1]
  485. Path -> Partition:
  486. pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/src
  487. Partition
  488. base file name: src
  489. input format: org.apache.hadoop.mapred.TextInputFormat
  490. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  491. properties:
  492. bucket_count -1
  493. columns key,value
  494. columns.types string:string
  495. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  496. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  497. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/src
  498. name default.src
  499. serialization.ddl struct src { string key, string value}
  500. serialization.format 1
  501. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  502. transient_lastDdlTime 1297378968
  503. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  504. input format: org.apache.hadoop.mapred.TextInputFormat
  505. output format: org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  506. properties:
  507. bucket_count -1
  508. columns key,value
  509. columns.types string:string
  510. file.inputformat org.apache.hadoop.mapred.TextInputFormat
  511. file.outputformat org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat
  512. location pfile:/data/users/sdong/www/open-source-hive1/build/ql/test/data/warehouse/src
  513. name default.src
  514. serialization.ddl struct src { string key, string value}
  515. serialization.format 1
  516. serialization.lib org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  517. transient_lastDdlTime 1297378968
  518. serde: org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe
  519. name: default.src
  520. name: default.src
  521. Reduce Operator Tree:
  522. Group By Operator
  523. aggregations:
  524. expr: count(VALUE._col0)
  525. bucketGroup: false
  526. keys:
  527. expr: KEY._col0
  528. type: string
  529. mode: mergepartial
  530. outputColumnNames: _col0, _col1
  531. Select Operator
  532. expressions:
  533. expr: _col0
  534. type: string
  535. expr: _col1
  536. type: bigint
  537. outputColumnNames: _col0, _col1
  538. File Output Operator
  539. compressed: false
  540. GlobalTableId: 0
  541. directory: file:/tmp/sdong/hive_2011-02-10_16-06-08_256_5728117320203012463/-mr-10004
  542. NumFilesPerFileSink: 1
  543. table:
  544. input format: org.apache.hadoop.mapred.SequenceFileInputFormat
  545. output format: org.apache.hadoop.hive.ql.io.HiveSequenceFileOutputFormat
  546. properties:
  547. columns _col0,_col1
  548. columns.types string,bigint
  549. escape.delim \
  550. TotalFiles: 1
  551. GatherStats: false
  552. MultiFileSpray: false
  553. PREHOOK: query: INSERT OVERWRITE TABLE dest_j1
  554. SELECT /*+ MAPJOIN(x) */ x.key, x.value, subq1.cnt
  555. FROM
  556. ( SELECT x.key as key, count(1) as cnt from src x where x.key < 20 group by x.key
  557. UNION ALL
  558. SELECT x1.key as key, count(1) as cnt from src x1 where x1.key > 100 group by x1.key
  559. ) subq1
  560. JOIN src1 x ON (x.key = subq1.key)
  561. PREHOOK: type: QUERY
  562. PREHOOK: Input: default@src
  563. PREHOOK: Input: default@src1
  564. PREHOOK: Output: default@dest_j1
  565. POSTHOOK: query: INSERT OVERWRITE TABLE dest_j1
  566. SELECT /*+ MAPJOIN(x) */ x.key, x.value, subq1.cnt
  567. FROM
  568. ( SELECT x.key as key, count(1) as cnt from src x where x.key < 20 group by x.key
  569. UNION ALL
  570. SELECT x1.key as key, count(1) as cnt from src x1 where x1.key > 100 group by x1.key
  571. ) subq1
  572. JOIN src1 x ON (x.key = subq1.key)
  573. POSTHOOK: type: QUERY
  574. POSTHOOK: Input: default@src
  575. POSTHOOK: Input: default@src1
  576. POSTHOOK: Output: default@dest_j1
  577. POSTHOOK: Lineage: dest_j1.key SIMPLE [(src1)x.FieldSchema(name:key, type:string, comment:default), ]
  578. POSTHOOK: Lineage: dest_j1.val2 EXPRESSION [(src)x.null, (src)x1.null, ]
  579. POSTHOOK: Lineage: dest_j1.value SIMPLE [(src1)x.FieldSchema(name:value, type:string, comment:default), ]
  580. PREHOOK: query: select * from dest_j1 x order by x.key
  581. PREHOOK: type: QUERY
  582. PREHOOK: Input: default@dest_j1
  583. PREHOOK: Output: file:/tmp/sdong/hive_2011-02-10_16-06-21_981_8339275278749703354/-mr-10000
  584. POSTHOOK: query: select * from dest_j1 x order by x.key
  585. POSTHOOK: type: QUERY
  586. POSTHOOK: Input: default@dest_j1
  587. POSTHOOK: Output: file:/tmp/sdong/hive_2011-02-10_16-06-21_981_8339275278749703354/-mr-10000
  588. POSTHOOK: Lineage: dest_j1.key SIMPLE [(src1)x.FieldSchema(name:key, type:string, comment:default), ]
  589. POSTHOOK: Lineage: dest_j1.val2 EXPRESSION [(src)x.null, (src)x1.null, ]
  590. POSTHOOK: Lineage: dest_j1.value SIMPLE [(src1)x.FieldSchema(name:value, type:string, comment:default), ]
  591. 128 3
  592. 146 val_146 2
  593. 150 val_150 1
  594. 213 val_213 2
  595. 224 2
  596. 238 val_238 2
  597. 255 val_255 2
  598. 273 val_273 3
  599. 278 val_278 2
  600. 311 val_311 3
  601. 369 3
  602. 401 val_401 5
  603. 406 val_406 4