-- Sample table for the cost-allocation example.
-- In the sample data, per-country sales rows carry sales_volume, while the
-- rows with country 'None' carry the fixed costs of a month.
CREATE TABLE sales (
    id           INT AUTO_INCREMENT,
    country      VARCHAR(255),
    sales_date   DATE,
    sales_volume INT,
    fix_costs    INT,
    PRIMARY KEY (id)
);
-- Seed data: three countries with one sales date per month, plus one 'None'
-- row per month that holds that month's fixed costs.
-- String literals use single quotes (double quotes denote identifiers when
-- ANSI_QUOTES is enabled) and the INT columns receive numeric literals
-- instead of strings that need implicit conversion.
INSERT INTO sales
    (country, sales_date, sales_volume, fix_costs)
VALUES
    ('DE',   '2020-01-03', 500,    0),
    ('NL',   '2020-01-03', 320,    0),
    ('FR',   '2020-01-03', 350,    0),
    ('None', '2020-01-30',   0, 2000),
    ('DE',   '2020-02-15', 700,    0),
    ('NL',   '2020-02-15', 420,    0),
    ('FR',   '2020-02-15', 180,    0),
    ('None', '2020-02-29',   0, 5000),
    ('DE',   '2020-03-27', 180,    0),
    ('NL',   '2020-03-27', 670,    0),
    ('FR',   '2020-03-27', 970,    0),
    ('None', '2020-03-31',   0, 4000);
预期结果:
sales_date country sales_volume fix_costs
2020-01-03 DE 500 27.6 (=2000/31 = 64.5 * 0.43)
2020-01-03 FR 350 19.3 (=2000/31 = 64.5 * 0.30)
2020-01-03 NL 320 17.6 (=2000/31 = 64.5 * 0.27)
2020-02-15 DE 700 92.8 (=5000/29 = 172.4 * 0.54)
2020-02-15 FR 180 23.9 (=5000/29 = 172.4 * 0.14)
2020-02-15 NL 420 55.7 (=5000/29 = 172.4 * 0.32)
2020-03-27 DE 180 12.8 (=4000/31 = 129.0 * 0.10)
2020-03-27 FR 970 68.8 (=4000/31 = 129.0 * 0.53)
2020-03-27 NL 670 47.5 (=4000/31 = 129.0 * 0.37)
在上表中,每个月都有一笔 fix_costs(固定成本)。
现在,我想把每个月的 fix_costs 按天、按国家/地区进行分摊。
为此,我用下面的表达式计算每个月的 fix_cost_per_day:
-- DAY(LAST_DAY(sales_date)) is the number of days in the month of sales_date.
SUM(fix_costs) / DAY(LAST_DAY(sales_date)) AS fix_cost_per_day
但是,我不知道如何把每个国家/地区的每日收入份额(daily revenue share per country)应用到 fix_cost_per_day 上。
我应该如何修改下面的查询才能得到预期结果:
-- Starting point from the question: totals per (sales_date, country) group.
-- SUM(fix_costs) only covers the rows of each single group here, so it is
-- not yet the fixed-cost total of the whole month.
SELECT
    sales_date,
    country,
    SUM(sales_volume),
    SUM(fix_costs) / DAY(LAST_DAY(sales_date)) AS fix_cost_per_day
FROM sales
GROUP BY
    sales_date,
    country;
答案 0 :(得分:1)
首先,您当前的查询并不能得到您想要的结果。看起来您实际上需要的是对 fix_costs 按月做窗口求和。因此我会从下面的查询开始:
-- Step 1: spread each month's fixed costs evenly over the days of that month.
-- The inner sum(fix_costs) aggregates per (sales_date, country) group; the
-- outer windowed sum adds those group totals up per calendar month, so every
-- row of a month sees the month's full fixed costs.
select
    sales_date,
    country,
    sum(sales_volume),
    sum(sum(fix_costs)) over(partition by year(sales_date), month(sales_date))
        / day(last_day(sales_date))  -- number of days in the month
        as fix_cost_per_day
from sales
group by sales_date, country
-- Explicit ordering: without it the row order of the result is not guaranteed.
order by sales_date, country;
这将产生:
sales_date | country | sum(sales_volume) | fix_cost_per_day
:--------- | :------ | ----------------: | ---------------:
2020-01-03 | DE | 500 | 64.5161
2020-01-03 | FR | 350 | 64.5161
2020-01-03 | NL | 320 | 64.5161
2020-01-30 | None | 0 | 64.5161
2020-02-15 | DE | 700 | 172.4138
2020-02-15 | FR | 180 | 172.4138
2020-02-15 | NL | 420 | 172.4138
2020-02-29 | None | 0 | 172.4138
2020-03-27 | DE | 180 | 129.0323
2020-03-27 | FR | 970 | 129.0323
2020-03-27 | NL | 670 | 129.0323
2020-03-31 | None | 0 | 129.0323
在此基础上,您可以加入“每个国家/地区的每日收入份额”的逻辑。按我对您问题的理解,查询应为:
-- Step 2: allocate the per-day fixed cost of the month to each country in
-- proportion to its share of that day's total sales volume.
--   monthly fixed costs / days in month * country volume / daily total volume
-- The arithmetic is kept in this left-to-right order on purpose.
select
    sales_date,
    country,
    sum(sales_volume),
    sum(sum(fix_costs)) over(partition by year(sales_date), month(sales_date))
        / day(last_day(sales_date))
        * sum(sales_volume)
        -- Days whose total volume is 0 (the 'None' rows in the sample data)
        -- yield NULL; nullif makes that explicit instead of relying on the
        -- server's division-by-zero handling.
        / nullif(sum(sum(sales_volume)) over(partition by sales_date), 0)
        as fix_cost_per_day
from sales
group by sales_date, country
-- Explicit ordering: without it the row order of the result is not guaranteed.
order by sales_date, country;
返回:
sales_date | country | sum(sales_volume) | fix_cost_per_day
:--------- | :------ | ----------------: | ---------------:
2020-01-03 | DE | 500 | 27.57099531
2020-01-03 | FR | 350 | 19.29969672
2020-01-03 | NL | 320 | 17.64543700
2020-01-30 | None | 0 | null
2020-02-15 | DE | 700 | 92.83819629
2020-02-15 | FR | 180 | 23.87267905
2020-02-15 | NL | 420 | 55.70291777
2020-02-29 | None | 0 | null
2020-03-27 | DE | 180 | 12.76143212
2020-03-27 | FR | 970 | 68.76993974
2020-03-27 | NL | 670 | 47.50088621
2020-03-31 | None | 0 | null
如果需要,可以把该查询作为子查询,并在外层查询中进行过滤,从而去掉国家/地区为 'None' 的记录。(不能直接在该查询内部用 WHERE 过滤,否则 'None' 行中的 fix_costs 会在窗口求和之前就被排除掉。)
答案 1 :(得分:1)
要分摊这些数据,可以使用窗口函数。您需要先按月汇总各项数值,再用这些合计值相除:
-- Allocates each month's per-day fixed cost to the (sales_date, country)
-- groups in proportion to their share of the month's total sales volume.
SELECT
    sales_date,
    country,
    SUM(sales_volume),
    -- Per-group value as in the question's query: uses only the group's own fix_costs.
    SUM(fix_costs) / DAY(LAST_DAY(sales_date)) AS fix_cost_per_day,
    -- (monthly fixed costs / days in month) * (group volume / monthly volume);
    -- NULLIF yields NULL instead of dividing by zero for a month without sales.
    (SUM(SUM(fix_costs)) OVER (PARTITION BY yyyy, mm) / DAY(LAST_DAY(sales_date))) *
    (SUM(sales_volume) / NULLIF(SUM(SUM(sales_volume)) OVER (PARTITION BY yyyy, mm), 0)) AS allocated
FROM (
    -- Pre-compute year and month once so the window partitions stay short.
    SELECT
        s.country,
        s.sales_date,
        s.sales_volume,
        s.fix_costs,
        YEAR(s.sales_date) AS yyyy,
        MONTH(s.sales_date) AS mm
    FROM sales s
) s
-- yyyy and mm are determined by sales_date, so listing them does not change
-- the groups; it makes the columns used in PARTITION BY valid grouping columns.
GROUP BY sales_date, country, yyyy, mm
-- Explicit ordering: without it the row order of the result is not guaranteed.
ORDER BY sales_date, country;
这里是一个 db<>fiddle 演示。
请注意,子查询并不是必需的,它只是让按月分区写起来更方便。