blob: dc7f8328b05d5a1c0fdefad516f893e52d8d2f0a [file] [log] [blame]
buyingyic73348c2012-11-02 00:31:31 +00001-- create the tables and load the data
2create external table customer (C_CUSTKEY INT, C_NAME STRING, C_ADDRESS STRING, C_NATIONKEY INT, C_PHONE STRING, C_ACCTBAL DOUBLE, C_MKTSEGMENT STRING, C_COMMENT STRING) ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' STORED AS TEXTFILE LOCATION '/tpch/100/customer';
3create external table orders (O_ORDERKEY INT, O_CUSTKEY INT, O_ORDERSTATUS STRING, O_TOTALPRICE DOUBLE, O_ORDERDATE STRING, O_ORDERPRIORITY STRING, O_CLERK STRING, O_SHIPPRIORITY INT, O_COMMENT STRING) ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' STORED AS TEXTFILE LOCATION '/tpch/100/orders';
4
5-- create the result table
6create table q13_customer_distribution (c_count int, custdist int);
7
8-- the query
9insert overwrite table q13_customer_distribution
10select
11 c_count, count(1) as custdist
12from
13 (select
14 c_custkey, count(o_orderkey) as c_count
15 from
16 customer c left outer join orders o
17 on
18 c.c_custkey = o.o_custkey and not o.o_comment like '%special%requests%'
19 group by c_custkey
20 ) c_orders
21group by c_count
22order by custdist desc, c_count desc;
23
24DROP TABLE customer;
25DROP TABLE orders;
26DROP TABLE q13_customer_distribution;