[oracle性能优化]sql调优基础

作者：我的饭桶女神 | 来源：互联网 | 2023-10-15 19:16

不会根据执行计划进行sql调优的dba是不合格的，sqltuning是基本技能0.优化器的基本概念为sql语句找到最好的，执行成本最低的执行计划制定执行计划是以sq

不会根据执行计划进行sql调优的dba是不合格的，sql tuning是基本技能

0. 优化器的基本概念

优化器的作用是为sql语句找到最好的、执行成本最低的执行计划。
执行计划的制定是以sql语句中涉及到的对象的统计信息为基础的。

1. 统计信息的介绍

    -- Table-level statistics (user_tables, user_tab_statistics).
    -- The data dictionary stores unquoted identifiers in upper case, so the
    -- table-name literal must be upper case or the query returns no rows.
    select
        num_rows,      -- number of rows in the table
        blocks,        -- number of data blocks holding the table's data
        empty_blocks,  -- number of empty blocks in the table
        avg_space,     -- average free space per data block
        chain_cnt,     -- number of chained and migrated rows
        avg_row_len,   -- average length of a row
        last_analyzed  -- time statistics were most recently gathered
    from user_tables
    where table_name = 'NEW_SALES';

    -- Gather statistics for the table
    exec dbms_stats.gather_table_stats('sh','new_sales');

    -- Run the table-statistics query again to see the refreshed values.
    -- The dictionary stores the table name in upper case, hence 'NEW_SALES'.
    select
        num_rows,      -- number of rows in the table
        blocks,        -- number of data blocks holding the table's data
        empty_blocks,  -- number of empty blocks in the table
        avg_space,     -- average free space per data block
        chain_cnt,     -- number of chained and migrated rows
        avg_row_len,   -- average length of a row
        last_analyzed  -- time statistics were most recently gathered
    from user_tables
    where table_name = 'NEW_SALES';


     -- Column-level statistics (user_tab_columns, user_tab_col_statistics, user_tab_histograms).
     -- The table-name literal is upper case to match how the dictionary stores it,
     -- and the statement is terminated so the next command is not appended to it.
     select
         column_name,
         num_distinct,  -- number of distinct values (ndv)
         low_value,     -- lowest value in the column
         high_value,    -- highest value in the column
         density,       -- selectivity factor (density) = 1/ndv when no histogram exists
         num_nulls,     -- number of nulls
         num_buckets,   -- number of histogram buckets
         histogram      -- histogram type
     from user_tab_columns
     where table_name = 'NEW_SALES';

     -- Gather histograms; method_opt sets the bucket count requested per column
     exec dbms_stats.gather_table_stats(ownname => 'sh', tabname => 'new_sales', method_opt => 'for all columns size 1 for columns size 254 cust_id');


     -- Look at the column statistics again.
     -- Upper-case table name matches the dictionary; the statement is terminated
     -- so that the following query is parsed separately.
     select
         column_name,
         num_distinct,  -- number of distinct values (ndv)
         low_value,     -- lowest value in the column
         high_value,    -- highest value in the column
         density,       -- selectivity factor (density) = 1/ndv when no histogram exists
         num_nulls,     -- number of nulls
         num_buckets,   -- number of histogram buckets
         histogram      -- histogram type
     from user_tab_columns
     where table_name = 'NEW_SALES';

     -- Histogram endpoints for cust_id.
     -- Fixes: removed the stray comma before FROM (syntax error), upper-cased
     -- the dictionary literals, terminated the statement, and ordered the
     -- endpoints so the output reads in bucket order.
     select
         column_name,
         endpoint_number,
         endpoint_value
     from user_tab_histograms
     where table_name = 'NEW_SALES'
       and column_name = 'CUST_ID'
     order by endpoint_number;


    -- Extended statistics (user_stat_extensions).
    -- The join also correlates on table_name so that an identically named
    -- extension on another table cannot produce extra rows.
    -- The table-name literal is upper case to match the dictionary.
     select
         e.extension as col_group,
         t.num_distinct,
         t.histogram
     from user_stat_extensions e
     inner join user_tab_col_statistics t
         on  t.column_name = e.extension_name
         and t.table_name  = e.table_name
     where t.table_name = 'NEW_SALES';

     -- Create an extended-statistics column group on (prod_id, cust_id).
     -- The returned extension name is printed (visible with serveroutput on)
     -- instead of being silently discarded.
     declare
        cg_name varchar2(30);
     begin
        cg_name := dbms_stats.create_extended_stats('sh','new_sales','(prod_id,cust_id)');
        dbms_output.put_line(cg_name);
     end;
-- SQL*Plus runs a PL/SQL block only when it reaches a line containing just "/"
/

-- Show the extension name recorded for the (prod_id, cust_id) column group
select
    sys.dbms_stats.show_extended_stats_name('sh', 'new_sales', '(prod_id,cust_id)') as col_group_name
from dual;

-- Gather statistics for the column group (trailing "-" is the SQL*Plus line continuation)
exec dbms_stats.gather_table_stats(ownname => 'sh', tabname => 'new_sales', method_opt => -
    'for columns (prod_id,cust_id) size skewonly');

2.统计信息不准确容易导致的问题

表统计信息不准确
    导致了表的访问方式出现了问题(全表扫描和使用索引)
    导致了表和表的连接方式出现问题（应该使用hash join，却使用了nested loops）


列统计信息不准确
    导致了访问表的方式不同（错误的索引）
    导致了表的连接方式不同（应该使用hash join，但是使用了nested loops）

索引的统计信息不准确
导致了访问表的方式不同（应该使用索引，但是使用了全表扫描）

+++++++++++++++++++++++++++++++++++++++++++

-- Online table holding the current day's sales.
-- The statement is now terminated with ";" so that it does not run into
-- the CREATE TABLE that follows it in the script.
create table sales_online (
    prod_id       number       not null,
    cust_id       number       not null,
    time_id       date         not null,
    channel_id    number       not null,
    promo_id      number       not null,
    quantity_sold number(10,2) not null,
    amount_sold   number(10,2) not null
);

-- Historical archive table, range-partitioned by day on time_id.
-- Same column layout as sales_online.
create table sales_part (
    prod_id       number       not null,
    cust_id       number       not null,
    time_id       date         not null,
    channel_id    number       not null,
    promo_id      number       not null,
    quantity_sold number(10,2) not null,
    amount_sold   number(10,2) not null
)
partition by range (time_id) (
    partition part_20171218 values less than (to_date('19-12-2017','dd-mm-yyyy')),
    partition part_20171219 values less than (to_date('20-12-2017','dd-mm-yyyy'))
);

-- Load two days of history into the archive table from new_sales.
-- Target columns are listed explicitly so the inserts do not depend on the
-- physical column order of sales_part.
-- NOTE(review): time_id is derived from sysdate, while the partitions above
-- have fixed 2017-12 bounds -- presumably the script was meant to be run on
-- 2017-12-20; confirm before running on another date.
insert into sales_part (
    prod_id, cust_id, time_id, channel_id, promo_id, quantity_sold, amount_sold
)
select
    prod_id, cust_id, sysdate - 2, channel_id, promo_id, quantity_sold, amount_sold
from new_sales;

insert into sales_part (
    prod_id, cust_id, time_id, channel_id, promo_id, quantity_sold, amount_sold
)
select
    prod_id, cust_id, sysdate - 1, channel_id, promo_id, quantity_sold, amount_sold
from new_sales;

commit;

-- Index on cust_id for the online table
create index sales_cust_idx on sales_online(cust_id);

-- Index on cust_id for the archive table
create index sales_part_cust_idx on sales_part(cust_id);

-- Nightly job: archive the current day's data into sales_part, then empty
-- sales_online.
-- Steps: drop the old partition, add tomorrow's partition, exchange it with
-- sales_online, truncate sales_online, rebuild both indexes, gather statistics.
-- Each DDL statement is printed before it runs (visible with serveroutput on),
-- so a failing statement can be identified from the output.
declare
    -- Evaluate the date once, so the partition name used by the "add" and the
    -- "exchange" statements cannot differ if the block runs across midnight.
    v_next_day  constant date := trunc(sysdate) + 1;
    v_part_name constant varchar2(30) := 'part_' || to_char(v_next_day, 'yyyymmdd');

    -- Print one DDL statement, then execute it.
    procedure run_ddl(p_sql in varchar2) is
    begin
        dbms_output.put_line(p_sql);
        execute immediate p_sql;
    end run_ddl;
begin
    run_ddl('alter table sales_part drop partition part_20171219');

    run_ddl('alter table sales_part add partition ' || v_part_name ||
            ' values less than (to_date(''' || to_char(v_next_day, 'dd-mm-yyyy') ||
            ''',''dd-mm-yyyy''))');

    run_ddl('alter table sales_part exchange partition ' || v_part_name ||
            ' with table sales_online');

    run_ddl('truncate table sales_online');

    run_ddl('alter index sales_part_cust_idx rebuild online');
    run_ddl('alter index sales_cust_idx rebuild online');

    dbms_stats.gather_table_stats('sh', 'sales_part');
    -- sales_online was truncated above, so these statistics are gathered on
    -- an empty table.
    dbms_stats.gather_table_stats('sh', 'sales_online');
end;
-- SQL*Plus runs a PL/SQL block only when it reaches a line containing just "/"
/

-- Check the statistics recorded for sales_online.
-- Table-name literals are upper case to match the data dictionary, and the
-- first query is terminated so the two statements are parsed separately.

    -- Column-level statistics
    select
        column_name,
        num_distinct,  -- number of distinct values (ndv)
        low_value,     -- lowest value in the column
        high_value,    -- highest value in the column
        density,       -- selectivity factor (density) = 1/ndv when no histogram exists
        num_nulls,     -- number of nulls
        num_buckets,   -- number of histogram buckets
        histogram      -- histogram type
    from user_tab_columns
    where table_name = 'SALES_ONLINE';

    -- Table-level statistics
    select
        num_rows,      -- number of rows in the table
        blocks,        -- number of data blocks holding the table's data
        empty_blocks,  -- number of empty blocks in the table
        avg_space,     -- average free space per data block
        chain_cnt,     -- number of chained and migrated rows
        avg_row_len,   -- average length of a row
        last_analyzed  -- time statistics were most recently gathered
    from user_tables
    where table_name = 'SALES_ONLINE';

====实例1

-- Run the query against the archive table: total amount sold per customer
-- city for customers with cust_id > 100 during the first hour of 2017-12-18.
-- Rewritten with an explicit join, qualified column names and a statement
-- terminator; the rows returned are unchanged.
select
    c.cust_city,
    sum(s.amount_sold)
from sales_part s
inner join new_customers c
    on c.cust_id = s.cust_id
where s.cust_id > 100
  and s.time_id between to_date('2017-12-18 00:00:00', 'yyyy-mm-dd hh24:mi:ss')
                    and to_date('2017-12-18 01:00:00', 'yyyy-mm-dd hh24:mi:ss')
group by c.cust_city;

----------------------------------------------------------------------------------------------------------

|   0 | select statement         |               |     1 |    48 | 1779   (1)| 00:00:22 | |        |

|   1 | hash group by           |               |     1 |    48 | 1779   (1)| 00:00:22 | |        |

|* 2 |   hash join              |               |     1 |    48 | 1778   (1)| 00:00:22 | |        |

|   3 |    partition range single|               |     1 |    18 | 1373   (1)| 00:00:17 |     2 |     2 |

|* 4 |     table access full    | sales_part    |     1 |    18 | 1373   (1)| 00:00:17 |     2 |     2 |

|* 5 |    table access full     | new_customers | 54144 | 1586k|   405   (1)| 00:00:05 | |        |

-------------------------------------------------------------------------------------------

-- Same aggregation against the online table: total amount sold per customer
-- city for customers with cust_id > 100 during the first hour of 2017-12-20.
-- Rewritten with an explicit join, qualified column names and a statement
-- terminator; the rows returned are unchanged.
select
    c.cust_city,
    sum(s.amount_sold)
from sales_online s
inner join new_customers c
    on c.cust_id = s.cust_id
where s.cust_id > 100
  and s.time_id between to_date('2017-12-20 00:00:00', 'yyyy-mm-dd hh24:mi:ss')
                    and to_date('2017-12-20 01:00:00', 'yyyy-mm-dd hh24:mi:ss')
group by c.cust_city;

------------------------------------------------------------------------------------------------

| id | operation                     | name           | rows | bytes | cost (%cpu)| time     |

------------------------------------------------------------------------------------------------

|   0 | select statement              |                |     1 |    65 |   406   (1)| 00:00:05 |

|   1 | hash group by                |                |     1 |    65 |   406   (1)| 00:00:05 |

|* 2 |   hash join                   |                |     1 |    65 |   405   (1)| 00:00:05 |

|* 3 |    table access by index rowid| sales_online   |     1 |    35 |     0   (0)| 00:00:01 |

|* 4 |     index range scan          | sales_cust_idx |     1 |       |     0   (0)| 00:00:01 |

|* 5 |    table access full          | new_customers | 54144 | 1586k|   405   (1)| 00:00:05 |

------------------------------------------------------------------------------------------------

-- Insert some data into sales_online, stamped with the current date/time.
-- Target columns are listed explicitly so the insert does not depend on the
-- physical column order of sales_online.
insert into sales_online (
    prod_id, cust_id, time_id, channel_id, promo_id, quantity_sold, amount_sold
)
select
    prod_id, cust_id, sysdate, channel_id, promo_id, quantity_sold, amount_sold
from new_sales;

commit;

-- Query the online table again after loading data: total amount sold per
-- customer city for customers with cust_id > 100 during the first hour of
-- 2017-12-20.
-- Rewritten with an explicit join, qualified column names and a statement
-- terminator; the rows returned are unchanged.
select
    c.cust_city,
    sum(s.amount_sold)
from sales_online s
inner join new_customers c
    on c.cust_id = s.cust_id
where s.cust_id > 100
  and s.time_id between to_date('2017-12-20 00:00:00', 'yyyy-mm-dd hh24:mi:ss')
                    and to_date('2017-12-20 01:00:00', 'yyyy-mm-dd hh24:mi:ss')
group by c.cust_city;

------------------------------------------------------------------------------------------------

|   0 | select statement              |                |     1 |    65 |   406   (1)| 00:00:05 |

|   1 | hash group by                |                |     1 |    65 |   406   (1)| 00:00:05 |

|* 2 |   hash join                   |                |     1 |    65 |   405   (1)| 00:00:05 |

|* 3 |    table access by index rowid| sales_online   |     1 |    35 |     0   (0)| 00:00:01 |

|* 4 |     index range scan          | sales_cust_idx |     1 |       |     0   (0)| 00:00:01 |

|* 5 |    table access full          | new_customers | 54144 | 1586k|   405   (1)| 00:00:05 |

------------------------------------------------------------------------------------------------

-- Gathering statistics by hand is one possible remedy
-- (cascade => true is passed so the call also covers the table's indexes)
exec dbms_stats.gather_table_stats(ownname => 'sh', tabname => 'sales_online', cascade => true);

-------------------------------------------------------------------------------------

| id | operation           | name          | rows | bytes | cost (%cpu)| time     |

-------------------------------------------------------------------------------------

|   0 | select statement    |               |     1 |    48 | 1641   (1)| 00:00:20 |

|   1 | hash group by      |               |     1 |    48 | 1641   (1)| 00:00:20 |

|* 2 |   hash join         |               |     1 |    48 | 1640   (1)| 00:00:20 |

|* 3 |    table access full| sales_online |     1 |    18 | 1235   (1)| 00:00:15 |

|* 4 |    table access full| new_customers | 54144 | 1586k|   405   (1)| 00:00:05 |

-------------------------------------------------------------------------------------

执行计划变过来了（sales_online 改为全表扫描）。但这不是一个好办法，因为在生产时段搜集统计信息比较危险。

-- Alternative nightly job: instead of re-gathering statistics on the freshly
-- truncated sales_online, export its statistics before the partition
-- exchange and import them back afterwards.
-- Each DDL statement is printed before it runs (visible with serveroutput on).
declare
    -- Evaluate the date once, so the partition name used by the "add" and the
    -- "exchange" statements cannot differ if the block runs across midnight.
    v_next_day      constant date := trunc(sysdate) + 1;
    v_part_name     constant varchar2(30) := 'part_' || to_char(v_next_day, 'yyyymmdd');
    v_stattab_count pls_integer;

    -- Print one DDL statement, then execute it.
    procedure run_ddl(p_sql in varchar2) is
    begin
        dbms_output.put_line(p_sql);
        execute immediate p_sql;
    end run_ddl;
begin
    run_ddl('alter table sales_part drop partition part_20171219');

    -- export_table_stats writes into a user statistics table, which nothing
    -- else in this script creates; create it on the first run.
    select count(*)
      into v_stattab_count
      from all_tables
     where owner = 'SH'
       and table_name = 'SALES_ONLINE_ST';

    if v_stattab_count = 0 then
        dbms_stats.create_stat_table(ownname => 'sh', stattab => 'sales_online_st');
    end if;

    -- Export the statistics while sales_online still holds the day's data
    dbms_stats.export_table_stats(ownname => 'sh', tabname => 'sales_online', stattab => 'sales_online_st', statid => 'a2');

    run_ddl('alter table sales_part add partition ' || v_part_name ||
            ' values less than (to_date(''' || to_char(v_next_day, 'dd-mm-yyyy') ||
            ''',''dd-mm-yyyy''))');

    run_ddl('alter table sales_part exchange partition ' || v_part_name ||
            ' with table sales_online');

    run_ddl('truncate table sales_online');

    run_ddl('alter index sales_part_cust_idx rebuild online');
    run_ddl('alter index sales_cust_idx rebuild online');

    dbms_stats.gather_table_stats('sh', 'sales_part');
    -- Statistics are deliberately NOT re-gathered on sales_online here; the
    -- exported set is imported below instead.

    -- Import the statistics saved before the exchange
    dbms_stats.import_table_stats(ownname => 'sh', tabname => 'sales_online', stattab => 'sales_online_st', statid => 'a2', no_invalidate => true);
end;
-- SQL*Plus runs a PL/SQL block only when it reaches a line containing just "/"
/

推荐阅读

hash
MySQL索引详解与优化

本文深入探讨了MySQL中的索引机制，包括索引的基本概念、优势与劣势、分类及其实现原理，并详细介绍了索引的使用场景和优化技巧。通过具体示例，帮助读者更好地理解和应用索引以提升数据库性能。 ... [详细]

蜡笔小新 2024-12-25 19:52:47
hash
深入理解 SQL 视图、存储过程与事务

本文详细介绍了SQL中的视图、存储过程和事务的概念及应用。视图为用户提供了一种灵活的数据查询方式，存储过程则封装了复杂的SQL逻辑，而事务确保了数据库操作的完整性和一致性。 ... [详细]

蜡笔小新 2024-12-27 17:40:42
foreach
MyBatis 动态 SQL 详解与应用

本文深入探讨 MyBatis 中动态 SQL 的使用方法，包括 if/where、trim 自定义字符串截取规则、choose 分支选择、封装查询和修改条件的 where/set 标签、批量处理的 foreach 标签以及内置参数和 bind 的用法。 ... [详细]

蜡笔小新 2024-12-27 16:20:10
default
利用存储过程构建年度日历表的详细指南

本文将介绍如何使用SQL存储过程创建一个完整的年度日历表。通过实例演示，帮助读者掌握存储过程的应用技巧，并提供详细的代码解析和执行步骤。 ... [详细]

蜡笔小新 2024-12-26 18:20:17
default
长春大学软件工程：二叉排序树实验报告

本实验主要探讨了二叉排序树（BST）的基本操作，包括创建、查找和删除节点。通过具体实例和代码实现，详细介绍了如何使用递归和非递归方法进行关键字查找，并展示了删除特定节点后的树结构变化。 ... [详细]

蜡笔小新 2024-12-26 15:32:56
default
openGauss每日一练：第6天 - 模式的创建、修改与删除

本篇笔记记录了openGauss数据库中关于模式（Schema）的创建、修改和删除操作。通过这些操作，用户可以更好地管理和控制数据库对象。实验环境为openGauss 2.0.0，并使用由墨天轮提供的线上环境。 ... [详细]

蜡笔小新 2024-12-26 00:17:35
default
MySQL LAST_INSERT_ID() 函数深入解析

本文详细介绍了 MySQL 中 LAST_INSERT_ID() 函数的使用方法及其工作原理，包括如何获取最后一个插入记录的自增 ID、多行插入时的行为以及在不同客户端环境下的表现。 ... [详细]

蜡笔小新 2024-12-25 22:04:04
default
深入理解 Oracle 存储函数：计算员工年收入

本文介绍如何使用 Oracle 存储函数查询特定员工的年收入。我们将详细解释存储函数的创建过程，并提供完整的代码示例。 ... [详细]

蜡笔小新 2024-12-28 09:49:42
foreach
Akka BackoffSupervisor的深入解析与实践

本文详细介绍了Akka中的BackoffSupervisor机制，探讨其在处理持久化失败和Actor重启时的应用。通过具体示例，展示了如何配置和使用BackoffSupervisor以实现更细粒度的异常处理。 ... [详细]

蜡笔小新 2024-12-27 15:04:09
foreach
网站与MySQL数据库的连接与交互

本文详细介绍了如何通过多种编程语言（如PHP、JSP）实现网站与MySQL数据库的连接，包括创建数据库、表的基本操作，以及数据的读取和写入方法。 ... [详细]

蜡笔小新 2024-12-27 14:09:23
foreach
Objective-C 编程中的关键语法点

本文探讨了 Objective-C 中的一些重要语法特性，包括 goto 语句、块（block）的使用、访问修饰符以及属性管理等。通过实例代码和详细解释，帮助开发者更好地理解和应用这些特性。 ... [详细]

蜡笔小新 2024-12-26 19:42:38
foreach
Splay Tree 区间操作优化

本文详细介绍了使用Splay Tree进行区间操作的实现方法，包括插入、删除、修改、翻转和求和等操作。通过这些操作，可以高效地处理动态序列问题，并且代码实现具有一定的挑战性，有助于编程能力的提升。 ... [详细]

蜡笔小新 2024-12-26 18:47:12
hash
从 .NET 转 Java 的自学之路：IO 流基础篇

本文详细介绍了 Java 中的 IO 流，包括字节流和字符流的基本概念及其操作方式。探讨了如何处理不同类型的文件数据，并结合编码机制确保字符数据的正确读写。同时，文中还涵盖了装饰设计模式的应用，以及多种常见的 IO 操作实例。 ... [详细]

蜡笔小新 2024-12-26 17:37:25
version
使用 SQLiteJDBC 和 HikariCP 实现 Java 程序连接 SQLite 数据库

本文介绍了如何通过 Maven 依赖引入 SQLiteJDBC 和 HikariCP 包，从而在 Java 应用中高效地连接和操作 SQLite 数据库。文章提供了详细的代码示例，并解释了每个步骤的实现细节。 ... [详细]

蜡笔小新 2024-12-26 17:34:42
default
PostgreSQL中的模式管理

本文由瀚高PG实验室撰写，详细介绍了如何在PostgreSQL中创建、管理和删除模式。文章涵盖了创建模式的基本命令、public模式的特性、权限设置以及通过角色对象简化操作的方法。 ... [详细]

蜡笔小新 2024-12-26 11:37:26

我的饭桶女神

这个家伙很懒，什么也没留下！

Tags | 热门标签

RankList | 热门文章