blob: b38ba2c47adb76e0ef2847101e7af6a661a97134 [file] [log] [blame]
buyingyi5df938f2013-03-24 07:20:08 +00001DROP TABLE lineitem;
2DROP TABLE supplier;
3DROP TABLE revenue;
4DROP TABLE max_revenue;
5DROP TABLE q15_top_supplier;
6
7-- create the tables and load the data
8create external table lineitem (L_ORDERKEY INT, L_PARTKEY INT, L_SUPPKEY INT, L_LINENUMBER INT, L_QUANTITY DOUBLE, L_EXTENDEDPRICE DOUBLE, L_DISCOUNT DOUBLE, L_TAX DOUBLE, L_RETURNFLAG STRING, L_LINESTATUS STRING, L_SHIPDATE STRING, L_COMMITDATE STRING, L_RECEIPTDATE STRING, L_SHIPINSTRUCT STRING, L_SHIPMODE STRING, L_COMMENT STRING) ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' STORED AS TEXTFILE LOCATION '/tpch/10/lineitem';
9create external table supplier (S_SUPPKEY INT, S_NAME STRING, S_ADDRESS STRING, S_NATIONKEY INT, S_PHONE STRING, S_ACCTBAL DOUBLE, S_COMMENT STRING) ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' STORED AS TEXTFILE LOCATION '/tpch/10/supplier';
10
11-- create result tables
12create table revenue(supplier_no int, total_revenue double);
13create table max_revenue(max_revenue double);
14create table q15_top_supplier(s_suppkey int, s_name string, s_address string, s_phone string, total_revenue double);
15
16
17set mapred.min.split.size=536870912;
18
19-- the query
20insert overwrite table revenue
21select
22 l_suppkey as supplier_no, sum(l_extendedprice * (1 - l_discount)) as total_revenue
23from
24 lineitem
25where
26 l_shipdate >= '1996-01-01' and l_shipdate < '1996-04-01'
27group by l_suppkey;
28
29insert overwrite table max_revenue
30select
31 max(total_revenue)
32from
33 revenue;
34
35insert overwrite table q15_top_supplier
36select
37 s_suppkey, s_name, s_address, s_phone, total_revenue
38from supplier s join revenue r
39 on
40 s.s_suppkey = r.supplier_no
41 join max_revenue m
42 on
43 r.total_revenue = m.max_revenue
44order by s_suppkey;
45