来OB这么久还没有接触啥金融的SQL,只能发点其他行业的数据库SQL优化案例。😂
今天拿到手的这个案例SQL是传统行业的,很奇葩的SQL,表设计连三范式都没弄好。
什么医疗,交通,能源这些传统行业的业务设计,SQL语句最奇葩了,也挺好玩的,有挑战性。
慢SQL:
-- Original slow statement (kept verbatim; the plan listed after it belongs to this text).
-- Comma-joins LNF (LI), PNF (PI) and FNF (FI), restricts FNF to a single
-- FLT_DT / SCH_DEP_CD, and returns the rows ordered by FI.SOFL_SEQ_NR.
SELECT LI.STATUS, FI.SOFL_SEQ_NR ,PI.CLAZZ,PI.HV_TYPE
FROM LNF LI, PNF PI, FNF FI
WHERE 1=1
-- Join LI to FI on airline code: FI.ALN_CD 'OQ' is mapped to 'CZ', any other code is used as-is.
AND LI.ALN_CD = DECODE(FI.ALN_CD, 'OQ', 'CZ', FI.ALN_CD)
and li.dep_arp_cd = fi.act_dep_cd
-- Join on flight number: for 'OQ' rows the number comes from a correlated scalar
-- subquery on OQ_FLT_INFO (characters 3-6 of oq_flt_nr are matched against fi.flt_nr,
-- then characters 3-6 of cz_flt_nr are used); other rows use fi.flt_nr directly.
-- NOTE(review): as a scalar subquery this presumably expects at most one matching OQ_FLT_INFO row - confirm.
and li.flt_nr = DECODE(fi.aln_cd,'OQ',substr(( select cz_flt_nr from OQ_FLT_INFO oq where substr(oq.oq_flt_nr,3,4)= fi.flt_nr) ,3,4), fi.flt_nr)
and li.FLT_DT=FI.FLT_DT
AND LI.FK_PSGR_ID = PI.PSGR_ID
-- OR predicate on PNF; in the plan for this statement it appears as a
-- "UNION FOR OR" node with the join tree repeated once per branch.
AND (PI.HV_TYPE IS NOT NULL OR PI.CLAZZ IN ('F', 'F1', 'J', 'C', 'D', 'I', 'O'))
-- Constant filters on FI.
and FI.FLT_DT=date'2024-04-01'
and FI.SCH_DEP_CD='CAN'
ORDER BY FI.SOFL_SEQ_NR ;
执行时间:
执行计划(看不看得懂随缘、反正我没看):
1 #NSET2: [2903, 556029, 632]
2 #PIPE2: [2903, 556029, 632]
3 #PIPE2: [2901, 556029, 632]
4 #PRJT2: [2899, 556029, 632]; exp_num(4), is_atom(FALSE)
5 #SORT3: [2899, 556029, 632]; key_num(1), is_distinct(FALSE), top_flag(0), is_adaptive(0)
6 #UNION FOR OR2: [2788, 556029, 632]; key_num(0), outer_join(-)
7 #SLCT2: [1334, 278014, 632]; LI.FLT_NR = exp_simple_case
8 #HASH2 INNER JOIN: [1334, 278014, 632]; KEY_NUM(2); KEY(FI.ACT_DEP_CD=LI.DEP_ARP_CD AND exp_simple_case=LI.ALN_CD) KEY_NULL_EQU(0, 0)
9 #BLKUP2: [1, 385, 247]; IDX_FLIGHT_INFO02(FI)
10 #SSEK2: [1, 385, 247]; scan_type(ASC), IDX_FLIGHT_INFO02(FNF as FI), scan_range[(exp_cast(2024-04-01),'CAN',min),(exp_cast(2024-04-01),'CAN',max))
11 #SLCT2: [1324, 37479, 385]; NOT(PI.HV_TYPE IS NULL)
12 #HASH2 INNER JOIN: [1324, 37479, 385]; RKEY_UNIQUE KEY_NUM(1); KEY(LI.FK_PSGR_ID=PI.PSGR_ID) KEY_NULL_EQU(0)
13 #SLCT2: [1324, 37479, 385]; NOT(PI.HV_TYPE IS NULL)
14 #NEST LOOP INDEX JOIN2: [1324, 37479, 385]
15 #ACTRL: [1324, 37479, 385];
16 #BLKUP2: [1049, 37479, 247]; INDEX_LU_INTO_TAG_0416(LI)
17 #SLCT2: [1049, 37479, 247]; LI.FLT_DT = var3
18 #SSCN: [1049, 37479, 247]; INDEX_LU_INTO_TAG_0416(LNF as LI); btr_scan(1)
19 #BLKUP2: [244, 1, 30]; INDEX33555482(PI)
20 #SSEK2: [244, 1, 30]; scan_type(ASC), INDEX33555482(PNF as PI), scan_range[LI.FK_PSGR_ID,LI.FK_PSGR_ID]
21 #CSCN2: [475, 3573399, 138]; INDEX33555481(PNF as PI); btr_scan(1)
22 #SLCT2: [1334, 278014, 632]; LI.FLT_NR = exp_simple_case
23 #HASH2 INNER JOIN: [1334, 278014, 632]; KEY_NUM(2); KEY(FI.ACT_DEP_CD=LI.DEP_ARP_CD AND exp_simple_case=LI.ALN_CD) KEY_NULL_EQU(0, 0)
24 #BLKUP2: [1, 385, 247]; IDX_FLIGHT_INFO02(FI)
25 #SSEK2: [1, 385, 247]; scan_type(ASC), IDX_FLIGHT_INFO02(FNF as FI), scan_range[(exp_cast(2024-04-01),'CAN',min),(exp_cast(2024-04-01),'CAN',max))
26 #SLCT2: [1324, 37479, 385]; (exp11 AND PI.CLAZZ IN LIST)
27 #HASH2 INNER JOIN: [1324, 37479, 385]; RKEY_UNIQUE KEY_NUM(1); KEY(LI.FK_PSGR_ID=PI.PSGR_ID) KEY_NULL_EQU(0)
28 #SLCT2: [1324, 37479, 385]; (exp11 AND PI.CLAZZ IN LIST)
29 #NEST LOOP INDEX JOIN2: [1324, 37479, 385]
30 #ACTRL: [1324, 37479, 385];
31 #BLKUP2: [1049, 37479, 247]; INDEX_LU_INTO_TAG_0416(LI)
32 #SLCT2: [1049, 37479, 247]; LI.FLT_DT = var4
33 #SSCN: [1049, 37479, 247]; INDEX_LU_INTO_TAG_0416(LNF as LI); btr_scan(1)
34 #BLKUP2: [244, 1, 30]; INDEX33555482(PI)
35 #SSEK2: [244, 1, 30]; scan_type(ASC), INDEX33555482(PNF as PI), scan_range[LI.FK_PSGR_ID,LI.FK_PSGR_ID]
36 #CSCN2: [475, 3573399, 138]; INDEX33555481(PNF as PI); btr_scan(1)
37 #SPL2: [1, 279, 343]; key_num(2), spool_num(1), is_atom(FALSE), has_var(0), sites(-)
38 #PRJT2: [1, 279, 343]; exp_num(2), is_atom(FALSE)
39 #HASH2 INNER JOIN: [1, 279, 343]; KEY_NUM(1); KEY(exp11=FI.FLT_NR) KEY_NULL_EQU(0)
40 #CSCN2: [1, 279, 96]; INDEX33555478(OQ_FLT_INFO as OQ); btr_scan(1)
41 #BLKUP2: [1, 385, 247]; IDX_FLIGHT_INFO02(FI)
42 #SSEK2: [1, 385, 247]; scan_type(ASC), IDX_FLIGHT_INFO02(FNF as FI), scan_range[(exp_cast(2024-04-01),'CAN',min),(exp_cast(2024-04-01),'CAN',max))
43 #SPL2: [1, 279, 343]; key_num(2), spool_num(0), is_atom(FALSE), has_var(0), sites(-)
44 #PRJT2: [1, 279, 343]; exp_num(2), is_atom(FALSE)
45 #HASH2 INNER JOIN: [1, 279, 343]; KEY_NUM(1); KEY(exp11=FI.FLT_NR) KEY_NULL_EQU(0)
46 #CSCN2: [1, 279, 96]; INDEX33555478(OQ_FLT_INFO as OQ); btr_scan(1)
47 #BLKUP2: [1, 385, 247]; IDX_FLIGHT_INFO02(FI)
48 #SSEK2: [1, 385, 247]; scan_type(ASC), IDX_FLIGHT_INFO02(FNF as FI), scan_range[(exp_cast(2024-04-01),'CAN',min),(exp_cast(2024-04-01),'CAN',max))
表数据量:
上面SQL跑28秒,返回8行数据,还是挺慢的。
DM哥们说他已经加个HINT对 or 进行整体优化,但是还要跑12秒,客户不接受,所以找到我来看看。😅
加HINT优化方案:
-- Same statement as the slow query, with only the OPTIMIZER_OR_NBEXP(2) hint added.
-- Per the surrounding text the hint makes the optimizer handle the OR as a whole;
-- the plan listed after this statement shows a single filter
-- "(NOT(PI.HV_TYPE IS NULL) OR PI.CLAZZ IN LIST)" and no "UNION FOR OR" node.
SELECT /*+ OPTIMIZER_OR_NBEXP(2) */ LI.STATUS, FI.SOFL_SEQ_NR ,PI.CLAZZ,PI.HV_TYPE
FROM LNF LI, PNF PI, FNF FI
WHERE 1=1
-- Airline-code join: FI.ALN_CD 'OQ' is mapped to 'CZ', any other code is used as-is.
AND LI.ALN_CD = DECODE(FI.ALN_CD, 'OQ', 'CZ', FI.ALN_CD)
and li.dep_arp_cd = fi.act_dep_cd
-- Flight-number join: 'OQ' rows take characters 3-6 of cz_flt_nr from the correlated
-- OQ_FLT_INFO lookup; other rows use fi.flt_nr directly.
and li.flt_nr = DECODE(fi.aln_cd,'OQ',substr(( select cz_flt_nr from OQ_FLT_INFO oq where substr(oq.oq_flt_nr,3,4)= fi.flt_nr) ,3,4), fi.flt_nr)
and li.FLT_DT=FI.FLT_DT
AND LI.FK_PSGR_ID = PI.PSGR_ID
-- The OR predicate the hint is aimed at.
AND (PI.HV_TYPE IS NOT NULL OR PI.CLAZZ IN ('F', 'F1', 'J', 'C', 'D', 'I', 'O'))
-- Constant filters on FI.
and FI.FLT_DT=date'2024-04-01'
and FI.SCH_DEP_CD='CAN'
ORDER BY FI.SOFL_SEQ_NR ;
加HINT后执行计划:
1 #NSET2: [1372, 278014, 608]
2 #PIPE2: [1372, 278014, 608]
3 #PRJT2: [1371, 278014, 608]; exp_num(4), is_atom(FALSE)
4 #SORT3: [1371, 278014, 608]; key_num(1), is_distinct(FALSE), top_flag(0), is_adaptive(0)
5 #SLCT2: [1317, 278014, 608]; LI.FLT_NR = exp_simple_case
6 #HASH2 INNER JOIN: [1317, 278014, 608]; KEY_NUM(2); KEY(FI.ACT_DEP_CD=LI.DEP_ARP_CD AND exp_simple_case=LI.ALN_CD) KEY_NULL_EQU(0, 0)
7 #BLKUP2: [1, 385, 247]; IDX_FLIGHT_INFO02(FI)
8 #SSEK2: [1, 385, 247]; scan_type(ASC), IDX_FLIGHT_INFO02(FNF as FI), scan_range[(exp_cast(2024-04-01),'CAN',min),(exp_cast(2024-04-01),'CAN',max))
9 #SLCT2: [1307, 37479, 361]; (NOT(PI.HV_TYPE IS NULL) OR PI.CLAZZ IN LIST)
10 #HASH2 INNER JOIN: [1307, 37479, 361]; RKEY_UNIQUE KEY_NUM(1); KEY(LI.FK_PSGR_ID=PI.PSGR_ID) KEY_NULL_EQU(0)
11 #SLCT2: [1307, 37479, 361]; (NOT(PI.HV_TYPE IS NULL) OR PI.CLAZZ IN LIST)
12 #NEST LOOP INDEX JOIN2: [1307, 37479, 361]
13 #ACTRL: [1307, 37479, 361];
14 #BLKUP2: [1032, 37479, 235]; INDEX_LU_INTO_TAG_0416(LI)
15 #SLCT2: [1032, 37479, 235]; LI.FLT_DT = var2
16 #SSCN: [1032, 37479, 235]; INDEX_LU_INTO_TAG_0416(LNF as LI); btr_scan(1)
17 #BLKUP2: [244, 1, 30]; INDEX33555482(PI)
18 #SSEK2: [244, 1, 30]; scan_type(ASC), INDEX33555482(PNF as PI), scan_range[LI.FK_PSGR_ID,LI.FK_PSGR_ID]
19 #CSCN2: [467, 3573399, 126]; INDEX33555481(PNF as PI); btr_scan(1)
20 #SPL2: [1, 279, 343]; key_num(2), spool_num(0), is_atom(FALSE), has_var(0), sites(-)
21 #PRJT2: [1, 279, 343]; exp_num(2), is_atom(FALSE)
22 #HASH2 INNER JOIN: [1, 279, 343]; KEY_NUM(1); KEY(exp11=FI.FLT_NR) KEY_NULL_EQU(0)
23 #CSCN2: [1, 279, 96]; INDEX33555478(OQ_FLT_INFO as OQ); btr_scan(1)
24 #BLKUP2: [1, 385, 247]; IDX_FLIGHT_INFO02(FI)
25 #SSEK2: [1, 385, 247]; scan_type(ASC), IDX_FLIGHT_INFO02(FNF as FI), scan_range[(exp_cast(2024-04-01),'CAN',min),(exp_cast(2024-04-01),'CAN',max))
HINT 执行时间:
12秒相比原来的28秒已经有了很大的提升,但是客户表示不满意:ORACLE能秒出结果,到了达梦以后执行时间多了12倍,接受不了。😅
无解,最后找到哥,看看能不能帮他让这条SQL"秒出结果"。😎
简单看了看,加索引和使用HINT都不好使,只能等价改写了,再创建合适的索引,让这条SQL走上新的索引。
等价改写 + 索引优化方案:
-- Equivalent rewrite of the slow statement.
--   * FI: FNF is filtered to the single FLT_DT / SCH_DEP_CD first, and the two
--     DECODE expressions are exposed as plain columns V1 / V2, so LNF is joined
--     on four simple column equalities.
--   * PI: the OR predicate on PNF is split into two branches combined with
--     UNION ALL and then de-duplicated.
-- Every column inside the FI view is qualified with its table name. The
-- correlated reference FNF.FLT_NR in particular must not be left bare: an
-- unqualified name inside the subquery binds to OQ_FLT_INFO first if that
-- table has (or later gains) a column of the same name, which would silently
-- turn the lookup into an uncorrelated one.
SELECT LI.STATUS,
       FI.SOFL_SEQ_NR,
       PI.CLAZZ,
       PI.HV_TYPE
FROM LNF LI
INNER JOIN (SELECT FNF.ACT_DEP_CD,
                   FNF.FLT_DT,
                   FNF.SOFL_SEQ_NR,
                   -- Airline code to match against LNF: 'OQ' is mapped to 'CZ', others pass through.
                   DECODE(FNF.ALN_CD, 'OQ', 'CZ', FNF.ALN_CD) V1,
                   -- Flight number to match against LNF: for 'OQ' rows, characters 3-6 of the
                   -- CZ_FLT_NR found in OQ_FLT_INFO; otherwise FNF.FLT_NR itself.
                   DECODE(FNF.ALN_CD, 'OQ',
                          SUBSTR((SELECT OQ.CZ_FLT_NR
                                  FROM OQ_FLT_INFO OQ
                                  WHERE SUBSTR(OQ.OQ_FLT_NR, 3, 4) = FNF.FLT_NR), 3, 4),
                          FNF.FLT_NR) V2
            FROM FNF
            WHERE FNF.FLT_DT = DATE'2024-04-01'
              AND FNF.SCH_DEP_CD = 'CAN'
              -- Filters nothing out. NOTE(review): presumably here to stop the optimizer
              -- from merging this view back into the outer query - confirm before removing.
              AND ROWNUM > 0) FI
    ON LI.DEP_ARP_CD = FI.ACT_DEP_CD
   AND LI.FLT_DT = FI.FLT_DT
   AND LI.ALN_CD = FI.V1
   AND LI.FLT_NR = FI.V2
INNER JOIN (WITH PI AS (SELECT PSGR_ID, HV_TYPE, CLAZZ
                        FROM PNF)
            -- DISTINCT collapses the two copies UNION ALL produces for a row that
            -- satisfies both branches.
            -- NOTE(review): this equals the original OR predicate only if PNF has no
            -- duplicate (PSGR_ID, HV_TYPE, CLAZZ) rows; the original plan reports
            -- RKEY_UNIQUE for the PSGR_ID join, which suggests PSGR_ID is unique - confirm.
            SELECT DISTINCT PSGR_ID, HV_TYPE, CLAZZ
            FROM (SELECT PSGR_ID, HV_TYPE, CLAZZ
                  FROM PI
                  WHERE (PI.HV_TYPE IS NOT NULL)
                  UNION ALL
                  SELECT PSGR_ID, HV_TYPE, CLAZZ
                  FROM PI
                  WHERE PI.CLAZZ IN ('F', 'F1', 'J', 'C', 'D', 'I', 'O'))) PI
    ON LI.FK_PSGR_ID = PI.PSGR_ID
ORDER BY FI.SOFL_SEQ_NR;
-- Indexes added for the rewritten query.
-- NOTE(review): in the optimized plan shown in this article only IDX_1_2_3_LI
-- appears among these five; FNF is still read through IDX_FLIGHT_INFO02 and
-- PNF through INDEX33555482. Also, the columns of idx_1_2_3 (FLT_DT, SCH_DEP_CD)
-- are the leading columns of idx_1_2_3_FI. Confirm which of these are needed.
CREATE INDEX idx_pi_1_2
    ON PNF (PSGR_ID, CLAZZ, HV_TYPE);

CREATE INDEX idx_fi_1_2
    ON FNF (act_dep_cd, FLT_DT);

CREATE INDEX idx_1_2_3_FI
    ON FNF (FLT_DT, SCH_DEP_CD, act_dep_cd, SOFL_SEQ_NR);

-- Leading columns follow the four LNF join keys of the rewritten query;
-- FK_PSGR_ID and STATUS are the remaining LNF columns that query reads.
CREATE INDEX idx_1_2_3_li
    ON LNF (ALN_CD, dep_arp_cd, flt_nr, FLT_DT, FK_PSGR_ID, STATUS);

CREATE INDEX idx_1_2_3
    ON FNF (FLT_DT, SCH_DEP_CD);
优化后执行计划:
1 #NSET2: [821, 385, 596]
2 #PIPE2: [821, 385, 596]
3 #PRJT2: [821, 385, 596]; exp_num(4), is_atom(FALSE)
4 #SORT3: [821, 385, 596]; key_num(1), is_distinct(FALSE), top_flag(0), is_adaptive(0)
5 #SLCT2: [820, 385, 596]; LI.FK_PSGR_ID = PI.PSGR_ID
6 #NEST LOOP INNER JOIN2: [820, 385, 596]; [with var]
7 #HASH2 INNER JOIN: [2, 385, 470]; KEY_NUM(4); KEY(FI.ACT_DEP_CD=LI.DEP_ARP_CD AND FI.FLT_DT=LI.FLT_DT AND FI.V1=LI.ALN_CD AND FI.V2=LI.FLT_NR) KEY_NULL_EQU(0, 0, 0, 0)
8 #NEST LOOP INDEX JOIN2: [2, 385, 470]
9 #ACTRL: [2, 385, 470];
10 #PRJT2: [1, 385, 235]; exp_num(5), is_atom(FALSE)
11 #RN: [1, 385, 235]
12 #BLKUP2: [1, 385, 235]; IDX_FLIGHT_INFO02(FNF)
13 #SSEK2: [1, 385, 235]; scan_type(ASC), IDX_FLIGHT_INFO02(FNF), scan_range[(exp_cast(2024-04-01),'CAN',min),(exp_cast(2024-04-01),'CAN',max))
14 #SSEK2: [1, 1, 235]; scan_type(ASC), IDX_1_2_3_LI(LNF as LI), scan_range[(FI.V1,FI.ACT_DEP_CD,FI.V2,FI.FLT_DT,min,min),(FI.V1,FI.ACT_DEP_CD,FI.V2,FI.FLT_DT,max,max))
15 #SSCN: [989, 6461936, 235]; IDX_1_2_3_LI(LNF as LI); btr_scan(1)
16 #PRJT2: [2, 1, 126]; exp_num(3), is_atom(FALSE)
17 #DISTINCT: [2, 1, 126]
18 #PRJT2: [1, 2, 126]; exp_num(3), is_atom(FALSE)
19 #UNION ALL: [1, 2, 126]
20 #PRJT2: [1, 1, 126]; exp_num(3), is_atom(FALSE)
21 #SLCT2: [1, 1, 126]; NOT(PNF.HV_TYPE IS NULL)
22 #BLKUP2: [1, 1, 126]; INDEX33555482(PNF)
23 #SSEK2: [1, 1, 126]; scan_type(ASC), INDEX33555482(PNF), scan_range[var4,var4]
24 #PRJT2: [1, 1, 126]; exp_num(3), is_atom(FALSE)
25 #HASH RIGHT SEMI JOIN2: [1, 1, 126]; n_keys(1) KEY(DMTEMPVIEW_889228539.colname=PNF.CLAZZ) KEY_NULL_EQU(0)
26 #CONST VALUE LIST: [1, 7, 48]; row_num(7), col_num(1)
27 #BLKUP2: [1, 1, 126]; INDEX33555482(PNF)
28 #SSEK2: [1, 1, 126]; scan_type(ASC), INDEX33555482(PNF), scan_range[var4,var4]
29 #SPL2: [1, 1, 96]; key_num(1), spool_num(0), is_atom(TRUE), has_var(1), sites(-)
30 #PRJT2: [1, 1, 96]; exp_num(1), is_atom(TRUE)
31 #BLKUP2: [1, 6, 96]; INDEX33555479(OQ)
32 #SLCT2: [1, 6, 96]; var3 = exp11
33 #SSCN: [1, 6, 96]; INDEX33555479(OQ_FLT_INFO as OQ); btr_scan(1)
执行时间:
通过改写+创建索引优化后,能做到像ORACLE这样,真"秒出结果"。😺
堆表和索引组织表的区别还是蛮大的,以前的老系统,业务SQL写得烂,用堆表跑问题不大,Oracle 的 CBO 算法牛逼,也扛得住。
**但是现在很多国产数据库都是使用索引组织表(IOT表),例如** OB、DM、TiDB 等国产数据库。
由于IOT表的特性,在使用场景上对一些老系统并不友好(老系统业务设计随意、业务逻辑较多在数据库层面实现),所以会产生很多性能问题:ORACLE 的索引都迁移到国产数据库了,性能还这么差,为什么没用上原来的索引啥的,等等诸如此类的问题。
要做国产化适配改造,并不能只满足于数据库功能、特性上的实现,业务模型也要配合整体来进行改造。
感谢各位读者同学能看到这里,如果有一些奇葩的SQL问题也可以联系我。🥰🥰🥰