-- Order header table: order number, transaction location and transaction date.
-- Fields are separated by ',' and rows by a newline.
CREATE TABLE stock (
    ordernumber STRING,  -- order number
    locationid  STRING,  -- transaction location
    dateID      STRING   -- transaction date
)
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY ','
    LINES TERMINATED BY '\n';
-- Order detail table: the line items of an order, keyed to the order header
-- by ordernumber. Fields are separated by ',' and rows by a newline.
CREATE TABLE stockdetail (
    ordernumber STRING,  -- order number
    rownum      INT,     -- line number
    itemid      STRING,  -- item
    qty         INT,     -- quantity
    price       INT,     -- price
    amount      INT      -- total amount
)
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY ','
    LINES TERMINATED BY '\n';
创建表,导入数据
-- Load the local text files into their tables; OVERWRITE replaces whatever
-- each table currently holds.
LOAD DATA LOCAL INPATH '/home/zkpk/tbdata/sdate.txt'
    OVERWRITE INTO TABLE sdate;

LOAD DATA LOCAL INPATH '/home/zkpk/tbdata/stock.txt'
    OVERWRITE INTO TABLE stock;

LOAD DATA LOCAL INPATH '/home/zkpk/tbdata/stockdetail.txt'
    OVERWRITE INTO TABLE stockdetail;
1、计算所有订单每年的总金额
算法分析:
要计算所有订单每年的总金额,首先需要获取所有订单的订单号、订单日期和订单金额信息,
然后把这些信息和日期表进行关联,
获取年份信息,最后根据这四个列按年份归组统计获取所有订单每年的总金额。
关于三张表:stock a, stockdetail b, sdate c
-- Total order amount per year.
-- Each detail line is matched to its order header (to get the order date),
-- the date is matched to the date table (to get the year), and the amounts
-- are summed per year. Explicit JOIN ... ON keeps every join condition next
-- to the table it belongs to, so none can be dropped by accident.
SELECT
    c.theyear,
    SUM(b.amount)
FROM stock a
JOIN stockdetail b
    ON a.ordernumber = b.ordernumber
JOIN sdate c
    ON a.dateid = c.dateid
GROUP BY c.theyear
ORDER BY c.theyear;
2、计算所有订单每年最大金额订单的销售额
该算法分为两步:
1.按照日期和订单号进行归组计算,
获取所有订单每天的销售数据;
stock a,stockdetail b
-- Total amount of every order, together with the order's date.
-- Detail lines are summed per (dateid, ordernumber).
SELECT
    a.dateid,
    a.ordernumber,
    SUM(b.amount) AS sumofamount
FROM stock a
JOIN stockdetail b
    ON a.ordernumber = b.ordernumber
GROUP BY
    a.dateid,
    a.ordernumber;
2.把第一步获取的数据和日期表进行关联,获取年份信息,
然后按照年份进行归组,使用Max函数,获取所有订单每年最大金额订单的销售额。
sdate c,第一步获取的数据 d
-- Largest single-order amount in each year.
-- The subquery d computes the total amount of every order (per dateid and
-- ordernumber); the outer query attaches the year from the date table and
-- keeps the maximum order total per year.
SELECT
    c.theyear,
    MAX(d.sumofamount)
FROM sdate c
JOIN (
    SELECT
        a.dateid,
        a.ordernumber,
        SUM(b.amount) AS sumofamount
    FROM stock a
    JOIN stockdetail b
        ON a.ordernumber = b.ordernumber
    GROUP BY
        a.dateid,
        a.ordernumber
) d
    ON c.dateid = d.dateid
GROUP BY c.theyear
ORDER BY c.theyear;
-- The 10 (theyear, thequot) periods with the highest total order amount.
-- NOTE(review): thequot is presumably the quarter column of sdate; confirm
-- against the sdate table definition.
-- Periods with equal totals at the cut-off are returned in no guaranteed order.
SELECT
    c.theyear,
    c.thequot,
    SUM(b.amount) AS sumofamount
FROM stock a
JOIN stockdetail b
    ON a.ordernumber = b.ordernumber
JOIN sdate c
    ON a.dateid = c.dateid
GROUP BY
    c.theyear,
    c.thequot
ORDER BY sumofamount DESC
LIMIT 10;
-- Orders whose total amount is greater than 100000.
-- HAVING repeats the aggregate expression instead of the select alias:
-- filtering on a select-list alias is an engine extension, while filtering
-- on the aggregate itself is standard SQL and selects the same groups.
SELECT
    a.ordernumber,
    SUM(b.amount) AS sumofamount
FROM stock a
JOIN stockdetail b
    ON a.ordernumber = b.ordernumber
GROUP BY a.ordernumber
HAVING SUM(b.amount) > 100000;
Result:
HMJSL00009024
119058
HMJSL00009958
159126
5、所有订单中每年最畅销货品
第一步:
统计出每年每种货品的销售总金额
stock a,stockdetail b,sdate c
===================================
-- Total sales amount of every item in every year.
-- Detail lines are matched to their order header for the date and to the
-- date table for the year, then summed per (theyear, itemid).
SELECT
    c.theyear,
    b.itemid,
    SUM(b.amount) AS sumofamount
FROM stock a
JOIN stockdetail b
    ON a.ordernumber = b.ordernumber
JOIN sdate c
    ON a.dateid = c.dateid
GROUP BY
    c.theyear,
    b.itemid;
第二步:
在第一步的数据上,统计出每年最大的销售总金额
将第一步的数据集起别名为d;
-- Highest per-item sales total in each year.
-- The subquery d holds the total sales amount of every item in every year;
-- the outer query keeps the largest of those totals per year.
SELECT
    d.theyear,
    MAX(d.sumofamount) AS maxofamount
FROM (
    SELECT
        c.theyear,
        b.itemid,
        SUM(b.amount) AS sumofamount
    FROM stock a
    JOIN stockdetail b
        ON a.ordernumber = b.ordernumber
    JOIN sdate c
        ON a.dateid = c.dateid
    GROUP BY
        c.theyear,
        b.itemid
) d
GROUP BY d.theyear;
第三步:所有订单中每年最畅销货品
e:每年每种货品的销售总金额
f:每年最大的销售总金额
-- Best-selling item(s) of each year, with that item's yearly sales total.
-- If several items tie for a year's highest total, all of them are returned.
WITH item_sales AS (
    -- Total sales amount of every item in every year. Defined once and used
    -- both as the candidate rows and as the input of the yearly maximum.
    SELECT
        c.theyear,
        b.itemid,
        SUM(b.amount) AS sumofamount
    FROM stock a
    JOIN stockdetail b
        ON a.ordernumber = b.ordernumber
    JOIN sdate c
        ON a.dateid = c.dateid
    GROUP BY
        c.theyear,
        b.itemid
),
year_max AS (
    -- Highest per-item sales total in each year.
    SELECT
        d.theyear,
        MAX(d.sumofamount) AS maxofamount
    FROM item_sales d
    GROUP BY d.theyear
)
-- item_sales has one row per (theyear, itemid) and year_max one row per
-- theyear, so the join cannot produce duplicate rows and needs no DISTINCT.
SELECT
    e.theyear,
    e.itemid,
    f.maxofamount
FROM item_sales e
JOIN year_max f
    ON e.theyear = f.theyear
    AND e.sumofamount = f.maxofamount
-- itemid is a tie-break so that tied items come out in a stable order.
ORDER BY
    e.theyear,
    e.itemid;