Oracle 上的条件 SUM
Conditional SUM on Oracle
我正在尝试使用条件 SUM 进行查询。 SUM 需要大于 15,然后重置它。像这样:
A | 3 | 3
B | 7 | 10
C | 6 | 16 -- ====
D | 5 | 5
E | 9 | 14
F | 3 | 17 -- ====
G | 8 | 8
我该怎么做?
使用递归 cte:
DROP TABLE tab;
CREATE TABLE tab
AS
SELECT 'A' as col1, 3 AS col2 FROM dual UNION ALL
SELECT 'B' as col1, 7 AS col2 FROM dual UNION ALL
SELECT 'C' as col1, 6 AS col2 FROM dual UNION ALL
SELECT 'D' as col1, 5 AS col2 FROM dual UNION ALL
SELECT 'E' as col1, 9 AS col2 FROM dual UNION ALL
SELECT 'F' as col1, 3 AS col2 FROM dual UNION ALL
SELECT 'G' as col1, 8 AS col2 FROM dual;
实际查询:
WITH cte_r AS (
SELECT t.*, ROW_NUMBER() OVER(ORDER BY t.col1) AS rn FROM tab t
), cte(col1, col2, total, rn) AS (
SELECT col1, col2, col2 AS total, rn
FROM cte_r
WHERE rn = 1
UNION ALL
SELECT cte_r.col1, cte_r.col2,
CASE WHEN cte.total >= 15 THEN 0 ELSE cte.total END + cte_r.col2 AS total,
cte_r.rn
FROM cte
JOIN cte_r
ON cte.rn = cte_r.rn-1
)
SELECT col1, col2, total
FROM cte
ORDER BY rn;
输出:
┌──────┬──────┬───────┐
│ COL1 │ COL2 │ TOTAL │
├──────┼──────┼───────┤
│ A │ 3 │ 3 │
│ B │ 7 │ 10 │
│ C │ 6 │ 16 │
│ D │ 5 │ 5 │
│ E │ 9 │ 14 │
│ F │ 3 │ 17 │
│ G │ 8 │ 8 │
└──────┴──────┴───────┘
此解决方案不仅限于 Oracle,它也适用于其他 RDBMS,例如 SQL Server/PostgreSQL/MySQL 8.0/SQLite 3.25.
作为递归 SQL 的替代方法,您还可以使用 SQL MODEL
子句。就个人而言,我发现这比递归 SQL 更容易阅读,但更难编写(因为大多数人,像我一样,需要查找语法)。
-- "test_data" is just a substitute for your real table, which I don't have
-- it is just so people without your table can run this example and would
-- not be part of your real solution.
with test_data ( sort_col, addend ) as
( SELECT 'A', 3 FROM DUAL UNION ALL
SELECT 'B', 7 FROM DUAL UNION ALL
SELECT 'C', 6 FROM DUAL UNION ALL
SELECT 'D', 5 FROM DUAL UNION ALL
SELECT 'E', 9 FROM DUAL UNION ALL
SELECT 'F', 3 FROM DUAL UNION ALL
SELECT 'G', 8 FROM DUAL ),
-- Solution begins here
sorted_inputs ( sort_col, sort_order, addend, running_sum_max_15) as
( SELECT sort_col, row_number() over ( order by sort_col ) sort_order, addend, 0 from test_data )
SELECT sort_col, addend, running_sum_max_15
from sorted_inputs
model
dimension by (sort_order)
measures ( sort_col, addend, running_sum_max_15 )
rules update
( running_sum_max_15[1] = addend[1],
running_sum_max_15[sort_order>1] =
case when running_sum_max_15[CV(sort_order)-1] < 15 THEN
running_sum_max_15[CV(sort_order)-1] ELSE 0 END+addend[CV(sort_order)]
)
结果
+----------+--------+--------------------+
| SORT_COL | ADDEND | RUNNING_SUM_MAX_15 |
+----------+--------+--------------------+
| A | 3 | 3 |
| B | 7 | 10 |
| C | 6 | 16 |
| D | 5 | 5 |
| E | 9 | 14 |
| F | 3 | 17 |
| G | 8 | 8 |
+----------+--------+--------------------+
有可能比递归 CTE 更容易达到预期的结果。
Oracle 12c支持MATCH_RECOGNIZE
,很适合解决"bin fitting"问题:
SELECT Col1, col2, rolling_sum, bin_num
FROM T
MATCH_RECOGNIZE (
ORDER BY col1
MEASURES SUM(col2) ROLLING_SUM, MATCH_NUMBER() AS bin_num
ALL ROWS PER MATCH
AFTER MATCH SKIP PAST LAST ROW
PATTERN ( A+ )
DEFINE A AS SUM(col2) < 15 + A.col2);
输出:
┌───────┬───────┬──────────────┬─────────┐
│ COL1 │ COL2 │ ROLLING_SUM │ BIN_NUM │
├───────┼───────┼──────────────┼─────────┤
│ A │ 3 │ 3 │ 1 │
│ B │ 7 │ 10 │ 1 │
│ C │ 6 │ 16 │ 1 │
│ D │ 5 │ 5 │ 2 │
│ E │ 9 │ 14 │ 2 │
│ F │ 3 │ 17 │ 2 │
│ G │ 8 │ 8 │ 3 │
└───────┴───────┴──────────────┴─────────┘
额外:Capping a runnig total 和 MODEL
我正在尝试使用条件 SUM 进行查询。 SUM 需要大于 15,然后重置它。像这样:
A | 3 | 3
B | 7 | 10
C | 6 | 16 -- ====
D | 5 | 5
E | 9 | 14
F | 3 | 17 -- ====
G | 8 | 8
我该怎么做?
使用递归 cte:
DROP TABLE tab;
CREATE TABLE tab
AS
SELECT 'A' as col1, 3 AS col2 FROM dual UNION ALL
SELECT 'B' as col1, 7 AS col2 FROM dual UNION ALL
SELECT 'C' as col1, 6 AS col2 FROM dual UNION ALL
SELECT 'D' as col1, 5 AS col2 FROM dual UNION ALL
SELECT 'E' as col1, 9 AS col2 FROM dual UNION ALL
SELECT 'F' as col1, 3 AS col2 FROM dual UNION ALL
SELECT 'G' as col1, 8 AS col2 FROM dual;
实际查询:
WITH cte_r AS (
SELECT t.*, ROW_NUMBER() OVER(ORDER BY t.col1) AS rn FROM tab t
), cte(col1, col2, total, rn) AS (
SELECT col1, col2, col2 AS total, rn
FROM cte_r
WHERE rn = 1
UNION ALL
SELECT cte_r.col1, cte_r.col2,
CASE WHEN cte.total >= 15 THEN 0 ELSE cte.total END + cte_r.col2 AS total,
cte_r.rn
FROM cte
JOIN cte_r
ON cte.rn = cte_r.rn-1
)
SELECT col1, col2, total
FROM cte
ORDER BY rn;
输出:
┌──────┬──────┬───────┐
│ COL1 │ COL2 │ TOTAL │
├──────┼──────┼───────┤
│ A │ 3 │ 3 │
│ B │ 7 │ 10 │
│ C │ 6 │ 16 │
│ D │ 5 │ 5 │
│ E │ 9 │ 14 │
│ F │ 3 │ 17 │
│ G │ 8 │ 8 │
└──────┴──────┴───────┘
此解决方案不仅限于 Oracle,它也适用于其他 RDBMS,例如 SQL Server/PostgreSQL/MySQL 8.0/SQLite 3.25.
作为递归 SQL 的替代方法,您还可以使用 SQL MODEL
子句。就个人而言,我发现这比递归 SQL 更容易阅读,但更难编写(因为大多数人,像我一样,需要查找语法)。
-- "test_data" is just a substitute for your real table, which I don't have
-- it is just so people without your table can run this example and would
-- not be part of your real solution.
with test_data ( sort_col, addend ) as
( SELECT 'A', 3 FROM DUAL UNION ALL
SELECT 'B', 7 FROM DUAL UNION ALL
SELECT 'C', 6 FROM DUAL UNION ALL
SELECT 'D', 5 FROM DUAL UNION ALL
SELECT 'E', 9 FROM DUAL UNION ALL
SELECT 'F', 3 FROM DUAL UNION ALL
SELECT 'G', 8 FROM DUAL ),
-- Solution begins here
sorted_inputs ( sort_col, sort_order, addend, running_sum_max_15) as
( SELECT sort_col, row_number() over ( order by sort_col ) sort_order, addend, 0 from test_data )
SELECT sort_col, addend, running_sum_max_15
from sorted_inputs
model
dimension by (sort_order)
measures ( sort_col, addend, running_sum_max_15 )
rules update
( running_sum_max_15[1] = addend[1],
running_sum_max_15[sort_order>1] =
case when running_sum_max_15[CV(sort_order)-1] < 15 THEN
running_sum_max_15[CV(sort_order)-1] ELSE 0 END+addend[CV(sort_order)]
)
结果
+----------+--------+--------------------+
| SORT_COL | ADDEND | RUNNING_SUM_MAX_15 |
+----------+--------+--------------------+
| A | 3 | 3 |
| B | 7 | 10 |
| C | 6 | 16 |
| D | 5 | 5 |
| E | 9 | 14 |
| F | 3 | 17 |
| G | 8 | 8 |
+----------+--------+--------------------+
有可能比递归 CTE 更容易达到预期的结果。
Oracle 12c支持MATCH_RECOGNIZE
,很适合解决"bin fitting"问题:
SELECT Col1, col2, rolling_sum, bin_num
FROM T
MATCH_RECOGNIZE (
ORDER BY col1
MEASURES SUM(col2) ROLLING_SUM, MATCH_NUMBER() AS bin_num
ALL ROWS PER MATCH
AFTER MATCH SKIP PAST LAST ROW
PATTERN ( A+ )
DEFINE A AS SUM(col2) < 15 + A.col2);
输出:
┌───────┬───────┬──────────────┬─────────┐
│ COL1 │ COL2 │ ROLLING_SUM │ BIN_NUM │
├───────┼───────┼──────────────┼─────────┤
│ A │ 3 │ 3 │ 1 │
│ B │ 7 │ 10 │ 1 │
│ C │ 6 │ 16 │ 1 │
│ D │ 5 │ 5 │ 2 │
│ E │ 9 │ 14 │ 2 │
│ F │ 3 │ 17 │ 2 │
│ G │ 8 │ 8 │ 3 │
└───────┴───────┴──────────────┴─────────┘
额外:Capping a runnig total 和 MODEL