buyingyi | c73348c | 2012-11-02 00:31:31 +0000 | [diff] [blame] | 1 | -- create the tables and load the data |
| 2 | create external table customer (C_CUSTKEY INT, C_NAME STRING, C_ADDRESS STRING, C_NATIONKEY INT, C_PHONE STRING, C_ACCTBAL DOUBLE, C_MKTSEGMENT STRING, C_COMMENT STRING) ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' STORED AS TEXTFILE LOCATION '/tpch/100/customer'; |
| 3 | create external table orders (O_ORDERKEY INT, O_CUSTKEY INT, O_ORDERSTATUS STRING, O_TOTALPRICE DOUBLE, O_ORDERDATE STRING, O_ORDERPRIORITY STRING, O_CLERK STRING, O_SHIPPRIORITY INT, O_COMMENT STRING) ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' STORED AS TEXTFILE LOCATION '/tpch/100/orders'; |
| 4 | |
| 5 | -- create the result table |
| 6 | create table q13_customer_distribution (c_count int, custdist int); |
| 7 | |
| 8 | -- the query |
| 9 | insert overwrite table q13_customer_distribution |
| 10 | select |
| 11 | c_count, count(1) as custdist |
| 12 | from |
| 13 | (select |
| 14 | c_custkey, count(o_orderkey) as c_count |
| 15 | from |
| 16 | customer c left outer join orders o |
| 17 | on |
| 18 | c.c_custkey = o.o_custkey and not o.o_comment like '%special%requests%' |
| 19 | group by c_custkey |
| 20 | ) c_orders |
| 21 | group by c_count |
| 22 | order by custdist desc, c_count desc; |
| 23 | |
| 24 | DROP TABLE customer; |
| 25 | DROP TABLE orders; |
| 26 | DROP TABLE q13_customer_distribution; |