使用LEAD / LAG函数的行转列

时间:2014-12-13 20:42:49

标签: sql oracle oracle11g window-functions

我想获得帮助以获得Oracle 11gR2的特定结果。

首先,我需要从表"RAW_DATA"开始,其内容如下:

-- Builds the RAW_DATA sample table from literal rows (CREATE TABLE ... AS SELECT).
-- Each row is a single EMH_MESURE reading for one EMH_PHASE ('A', 'B' or 'C')
-- at one EMH_DATE_HEURE; column names and types come from the first SELECT.
-- Things to notice in the data:
--   * several timestamps carry only one or two of the three phases
--     (e.g. 2014-12-04 00:00:00 has B and C but no A);
--   * at 2014-12-04 15:06:07 and 2014-12-04 16:27:59 all three phases read 0;
--   * the rows are not listed in chronological order (the 16:27:59 rows appear
--     after the 16:55:39 row), so consumers must sort by EMH_DATE_HEURE.
CREATE TABLE RAW_DATA
AS
SELECT 'MTL' AS EMH_CED,'ATW 25-55' AS EMH_ID,to_date('2014-12-03 17:17:10','yyyy-mm-dd hh24:mi:ss') AS EMH_DATE_HEURE,'AM' AS EMH_TYPE_MESURE,'A' AS EMH_PHASE,75 AS EMH_MESURE FROM dual union ALL
SELECT 'MTL','ATW 25-55',to_date('2014-12-03 17:17:10','yyyy-mm-dd hh24:mi:ss'),'AM','B',100 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-03 17:17:10','yyyy-mm-dd hh24:mi:ss'),'AM','C',98 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-03 17:17:29','yyyy-mm-dd hh24:mi:ss'),'AM','A',75 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-03 17:17:29','yyyy-mm-dd hh24:mi:ss'),'AM','B',100 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-03 17:17:29','yyyy-mm-dd hh24:mi:ss'),'AM','C',98 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-03 17:17:57','yyyy-mm-dd hh24:mi:ss'),'AM','A',84 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-03 17:17:57','yyyy-mm-dd hh24:mi:ss'),'AM','B',100 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-03 17:17:57','yyyy-mm-dd hh24:mi:ss'),'AM','C',98 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 00:00:00','yyyy-mm-dd hh24:mi:ss'),'AM','B',91 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 00:00:00','yyyy-mm-dd hh24:mi:ss'),'AM','C',89 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 15:06:07','yyyy-mm-dd hh24:mi:ss'),'AM','A',0 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 15:06:07','yyyy-mm-dd hh24:mi:ss'),'AM','B',0 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 15:06:07','yyyy-mm-dd hh24:mi:ss'),'AM','C',0 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:22:37','yyyy-mm-dd hh24:mi:ss'),'AM','A',23 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:22:37','yyyy-mm-dd hh24:mi:ss'),'AM','B',24 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:22:37','yyyy-mm-dd hh24:mi:ss'),'AM','C',24 FROM dual union ALL
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:27:36','yyyy-mm-dd hh24:mi:ss'),'AM','A',34 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:27:43','yyyy-mm-dd hh24:mi:ss'),'AM','B',40 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:27:43','yyyy-mm-dd hh24:mi:ss'),'AM','C',39 FROM dual union ALL
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:28:12','yyyy-mm-dd hh24:mi:ss'),'AM','A',51 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:28:12','yyyy-mm-dd hh24:mi:ss'),'AM','B',58 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:28:12','yyyy-mm-dd hh24:mi:ss'),'AM','C',57 FROM dual union ALL
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:40:33','yyyy-mm-dd hh24:mi:ss'),'AM','B',80 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:40:33','yyyy-mm-dd hh24:mi:ss'),'AM','C',78 FROM dual union ALL
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:41:02','yyyy-mm-dd hh24:mi:ss'),'AM','A',73 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:47:10','yyyy-mm-dd hh24:mi:ss'),'AM','A',83 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:55:39','yyyy-mm-dd hh24:mi:ss'),'AM','B',98 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:27:59','yyyy-mm-dd hh24:mi:ss'),'AM','A',0 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:27:59','yyyy-mm-dd hh24:mi:ss'),'AM','B',0 FROM dual union ALL 
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:27:59','yyyy-mm-dd hh24:mi:ss'),'AM','C',0 FROM dual union ALL
SELECT 'MTL','ATW 25-55',to_date('2014-12-04 16:56:37','yyyy-mm-dd hh24:mi:ss'),'AM','C',96 FROM dual;

我正在寻找的最终结果如下:

我需要在同一行数据中得到"EMH_PHASE"的每个取值("A"、"B"和"C")所对应的"EMH_MESURE"。该结果需要存储在三个新列中,分别命名为"MESURE_A"、"MESURE_B"和"MESURE_C"。

之后,在"RAW_DATA"按"EMH_DATE_HEURE"排序的前提下,我需要取得过零点(即MESURE_A=MESURE_B=MESURE_C=0时)之前和之后的数据行。我还需要与过零点本身相对应的数据行。在我的场景中,可能存在多个过零点。基于表"RAW_DATA",我想得到的结果如下:

EMH_CED, EMH_ID,     EMH_DATE_HEURE,     EMH_TYPE_MESURE, MESURE_A, MESURE_B, MESURE_C
MTL      ATW 25-55   2014-12-04 00:00:00       AM              84        91        89
MTL      ATW 25-55   2014-12-04 15:06:07       AM               0         0         0
MTL      ATW 25-55   2014-12-04 16:22:37       AM              23        24        24
MTL      ATW 25-55   2014-12-04 16:27:43       AM              34        40        39
MTL      ATW 25-55   2014-12-04 16:27:59       AM               0         0         0
MTL      ATW 25-55   2014-12-04 16:28:12       AM              51        58        57

所以,我首先使用下面的代码,把"RAW_DATA"中的"EMH_PHASE"列转换成3个不同的列("MESURE_A"、"MESURE_B"和"MESURE_C")。

WITH ROWS_TO_COLUMNS AS (
  -- Pivot the phase rows into columns: one output row per
  -- (EMH_CED, EMH_ID, EMH_DATE_HEURE, EMH_TYPE_MESURE), with the reading of
  -- each phase in its own column. A phase that has no row for a given
  -- timestamp yields NULL in its column (CASE without ELSE, MAX over no values).
  SELECT
      EMH_CED,
      EMH_ID,
      EMH_DATE_HEURE,
      EMH_TYPE_MESURE,
      MAX(CASE EMH_PHASE WHEN 'A' THEN EMH_MESURE END) AS MESURE_A,
      MAX(CASE EMH_PHASE WHEN 'B' THEN EMH_MESURE END) AS MESURE_B,
      MAX(CASE EMH_PHASE WHEN 'C' THEN EMH_MESURE END) AS MESURE_C
  FROM RAW_DATA
  GROUP BY
      EMH_CED,
      EMH_ID,
      EMH_DATE_HEURE,
      EMH_TYPE_MESURE
)

到目前为止,它似乎实现了我想要的效果,但结果中出现了一些多余的空值。

然后,我使用以下代码,用之前最近的一个非空值来填充这些空值:

-- Forward-fill: for every pivoted row, replace each MESURE_x with the most
-- recent non-NULL MESURE_x at or before that row's EMH_DATE_HEURE within the
-- same (EMH_CED, EMH_ID). The window is sorted newest-first and spans the
-- current row through the oldest row, so FIRST_VALUE ... IGNORE NULLS returns
-- the latest known reading. The partition columns are constant inside a
-- partition, so only EMH_DATE_HEURE is needed in the window ORDER BY.
NULLS_FILLED AS (
  SELECT
      EMH_CED,
      EMH_ID,
      EMH_DATE_HEURE,
      FIRST_VALUE(MESURE_A) IGNORE NULLS OVER (
          PARTITION BY EMH_CED, EMH_ID
          ORDER BY EMH_DATE_HEURE DESC
          RANGE BETWEEN CURRENT ROW AND UNBOUNDED FOLLOWING
      ) AS MESURE_A,
      FIRST_VALUE(MESURE_B) IGNORE NULLS OVER (
          PARTITION BY EMH_CED, EMH_ID
          ORDER BY EMH_DATE_HEURE DESC
          RANGE BETWEEN CURRENT ROW AND UNBOUNDED FOLLOWING
      ) AS MESURE_B,
      FIRST_VALUE(MESURE_C) IGNORE NULLS OVER (
          PARTITION BY EMH_CED, EMH_ID
          ORDER BY EMH_DATE_HEURE DESC
          RANGE BETWEEN CURRENT ROW AND UNBOUNDED FOLLOWING
      ) AS MESURE_C
  FROM ROWS_TO_COLUMNS
  ORDER BY EMH_DATE_HEURE
)

该操作后的结果是我在开始时寻找的结果。

下一步是我需要帮助的地方。当MESURE_A=MESURE_B=MESURE_C=0时,我只想获取该行的前一行(LAG)和后一行(LEAD),同时该行本身也需要显示。

现在,我只能获得LAG行,以及表格的最后一行(而这一行我并不想要)。我仍然需要找到一种方法,取回缺失的2行,并去掉我不想要的那一行。

到目前为止,我尝试了各种办法,但都没有得到好的结果。请帮帮我!

以下是我的其余代码,需要进行调整以获得所需的结果:

-- Continuation of the WITH clause: number every filled row in
-- (EMH_CED, EMH_ID, EMH_DATE_HEURE) order so gaps can be detected later.
,RN_DATA AS(
   SELECT NULLS_FILLED.*, row_number() over (order by EMH_CED, EMH_ID, EMH_DATE_HEURE) AS rn
FROM NULLS_FILLED
)

-- Keep only rows where all three phases are strictly positive and compute
-- grp = ROWNUM - rn. ROWNUM counts only the rows that pass the WHERE filter,
-- while rn also counted the filtered-out rows, so the difference changes each
-- time filtered-out rows are skipped; rows between two gaps share one grp.
-- NOTE(review): this relies on rows arriving from RN_DATA in rn order, which
-- no ORDER BY in this CTE enforces - confirm.
,DATA_GROUPED AS (
   SELECT RN_DATA.*, rownum - rn AS grp
FROM RN_DATA
WHERE MESURE_A>0 AND MESURE_B>0 AND MESURE_C>0
)

-- One output row per grp. Every column uses KEEP (DENSE_RANK FIRST ...) with
-- EMH_DATE_HEURE sorted DESC, so the values come from the latest row of each
-- group. The all-zero rows were removed by the filter above and the earlier
-- rows of each group are collapsed away, so neither the zero rows nor the
-- rows following them can appear in this result.
SELECT max(EMH_CED) keep (dense_rank first ORDER BY EMH_CED, EMH_ID, EMH_DATE_HEURE DESC) AS EMH_CED
  ,max(EMH_ID) keep (dense_rank first ORDER BY EMH_CED, EMH_ID, EMH_DATE_HEURE DESC) AS EMH_ID
  ,max(EMH_DATE_HEURE) keep (dense_rank first ORDER BY EMH_CED, EMH_ID, EMH_DATE_HEURE DESC) AS EMH_DATE_HEURE
  ,max(MESURE_A) keep (dense_rank first ORDER BY EMH_CED, EMH_ID, EMH_DATE_HEURE DESC) AS MESURE_A
  ,max(MESURE_B) keep (dense_rank first ORDER BY EMH_CED, EMH_ID, EMH_DATE_HEURE DESC) AS MESURE_B
  ,max(MESURE_C) keep (dense_rank first ORDER BY EMH_CED, EMH_ID, EMH_DATE_HEURE DESC) AS MESURE_C
  ,max(rn) keep (dense_rank first ORDER BY EMH_CED, EMH_ID, EMH_DATE_HEURE DESC) AS rn
FROM DATA_GROUPED
GROUP BY grp
ORDER BY rn
;

随意使用SQL Fiddle测试我的代码: http://sqlfiddle.com/#!4/e6b2e0/4/0

1 个答案:

答案 0 :(得分:1)

我不明白你为什么使用ROW_NUMBER,FIRST,LAST函数。您只需使用LEAD, LAG函数。

-- Returns every zero-crossing row (all three filled phase readings equal 0)
-- together with the row immediately before and the row immediately after it,
-- per (emh_ced, emh_id), ordered by timestamp.
--
-- The neighbour test is evaluated on the forward-filled readings, i.e. on the
-- same values as the current-row test. Computing LEAD/LAG in the same SELECT
-- as the fill would read the sparse, un-filled columns instead (select-list
-- aliases are not visible to sibling expressions), so a zero crossing whose
-- phases arrive at different timestamps would lose its neighbours.
WITH rows_to_columns AS (
    -- Pivot: one row per timestamp with each phase reading in its own column;
    -- a phase without a reading at that timestamp is NULL.
    SELECT
        emh_ced,
        emh_id,
        emh_date_heure,
        emh_type_mesure,
        MAX(CASE emh_phase WHEN 'A' THEN emh_mesure END) AS mesure_a,
        MAX(CASE emh_phase WHEN 'B' THEN emh_mesure END) AS mesure_b,
        MAX(CASE emh_phase WHEN 'C' THEN emh_mesure END) AS mesure_c
    FROM raw_data
    GROUP BY
        emh_ced,
        emh_id,
        emh_date_heure,
        emh_type_mesure
),
nulls_filled AS (
    -- Forward-fill: newest-first window from the current row back to the
    -- oldest row, so FIRST_VALUE ... IGNORE NULLS is the latest known reading.
    SELECT
        emh_ced,
        emh_id,
        emh_date_heure,
        emh_type_mesure,
        FIRST_VALUE(mesure_a) IGNORE NULLS OVER (
            PARTITION BY emh_ced, emh_id
            ORDER BY emh_date_heure DESC
            RANGE BETWEEN CURRENT ROW AND UNBOUNDED FOLLOWING
        ) AS mesure_a,
        FIRST_VALUE(mesure_b) IGNORE NULLS OVER (
            PARTITION BY emh_ced, emh_id
            ORDER BY emh_date_heure DESC
            RANGE BETWEEN CURRENT ROW AND UNBOUNDED FOLLOWING
        ) AS mesure_b,
        FIRST_VALUE(mesure_c) IGNORE NULLS OVER (
            PARTITION BY emh_ced, emh_id
            ORDER BY emh_date_heure DESC
            RANGE BETWEEN CURRENT ROW AND UNBOUNDED FOLLOWING
        ) AS mesure_c
    FROM rows_to_columns
),
zero_flagged AS (
    -- is_zero = 1 only when all three filled readings are exactly 0; a reading
    -- that is still NULL (no earlier value to fill from) makes the row non-zero.
    SELECT
        emh_ced,
        emh_id,
        emh_date_heure,
        emh_type_mesure,
        mesure_a,
        mesure_b,
        mesure_c,
        CASE
            WHEN mesure_a = 0 AND mesure_b = 0 AND mesure_c = 0 THEN 1
            ELSE 0
        END AS is_zero
    FROM nulls_filled
),
neighbours AS (
    -- Look one row back and one row forward in time; the default 0 covers the
    -- first and last row of each partition, which have no neighbour on one side.
    SELECT
        emh_ced,
        emh_id,
        emh_date_heure,
        emh_type_mesure,
        mesure_a,
        mesure_b,
        mesure_c,
        is_zero,
        LAG(is_zero, 1, 0) OVER (
            PARTITION BY emh_ced, emh_id
            ORDER BY emh_date_heure
        ) AS prev_is_zero,
        LEAD(is_zero, 1, 0) OVER (
            PARTITION BY emh_ced, emh_id
            ORDER BY emh_date_heure
        ) AS next_is_zero
    FROM zero_flagged
)
SELECT
    emh_ced,
    emh_id,
    emh_date_heure,
    emh_type_mesure,
    mesure_a,
    mesure_b,
    mesure_c
FROM neighbours
WHERE is_zero = 1          -- the zero crossing itself
   OR next_is_zero = 1     -- the row just before a zero crossing
   OR prev_is_zero = 1     -- the row just after a zero crossing
ORDER BY emh_date_heure;

Output:

| EMH_CED |    EMH_ID |                  EMH_DATE_HEURE | EMH_TYPE_MESURE | MESURE_A | MESURE_B | MESURE_C |
|---------|-----------|---------------------------------|-----------------|----------|----------|----------|
|     MTL | ATW 25-55 | December, 04 2014 00:00:00+0000 |              AM |       84 |       91 |       89 |
|     MTL | ATW 25-55 | December, 04 2014 15:06:07+0000 |              AM |        0 |        0 |        0 |
|     MTL | ATW 25-55 | December, 04 2014 16:22:37+0000 |              AM |       23 |       24 |       24 |
|     MTL | ATW 25-55 | December, 04 2014 16:27:43+0000 |              AM |       34 |       40 |       39 |
|     MTL | ATW 25-55 | December, 04 2014 16:27:59+0000 |              AM |        0 |        0 |        0 |
|     MTL | ATW 25-55 | December, 04 2014 16:28:12+0000 |              AM |       51 |       58 |       57 |