学习目标
学习openGauss收集统计信息、打印执行计划、垃圾收集和checkpoint
课程学习
连接数据库
root@modb:~# su - omm
omm@modb:~$ gsql -r
课程作业
1.创建表,并用generate_series(1,N)函数对表插入数据
-- Schema that holds the demo table.
CREATE SCHEMA tpcds;

-- Address table for the exercise. ca_address_sk is the only NOT NULL column;
-- every other column is nullable.
CREATE TABLE tpcds.customer_address (
    ca_address_sk    INTEGER       NOT NULL,
    ca_address_id    CHAR(16),
    ca_street_number CHAR(10),
    ca_street_name   VARCHAR(60),
    ca_street_type   CHAR(15),
    ca_suite_number  CHAR(10),
    ca_city          VARCHAR(60),
    ca_county        VARCHAR(30),
    ca_state         CHAR(2),
    ca_zip           CHAR(10),
    ca_country       VARCHAR(20),
    ca_gmt_offset    NUMERIC(5, 2),
    ca_location_type CHAR(20)
);
-- Seed three fully populated sample rows. The explicit column list keeps the
-- statement valid even if the column order of the table changes later.
INSERT INTO tpcds.customer_address (
    ca_address_sk, ca_address_id, ca_street_number, ca_street_name,
    ca_street_type, ca_suite_number, ca_city, ca_county, ca_state,
    ca_zip, ca_country, ca_gmt_offset, ca_location_type
)
VALUES
    (1, 'AAAAAAAABAAAAAAA', '18', 'Jackson', 'Parkway', 'Suite 280', 'Fairfield', 'Maricopa County', 'AZ', '86192', 'United States', -7.00, 'condo'),
    (2, 'AAAAAAAACAAAAAAA', '362', 'Washington 6th', 'RD', 'Suite 80', 'Fairview', 'Taos County', 'NM', '85709', 'United States', -7.00, 'condo'),
    (3, 'AAAAAAAADAAAAAAA', '585', 'Dogwood Washington', 'Circle', 'Suite Q', 'Pleasant Valley', 'York County', 'PA', '12477', 'United States', -5.00, 'single family');

-- Bulk-load rows with generate_series(start, stop): one row per integer in
-- 10..10000. Only ca_address_sk is supplied, so all other columns are NULL.
-- The statement is issued exactly once; the table has no unique constraint,
-- so a second run would silently store every value twice.
INSERT INTO tpcds.customer_address (ca_address_sk)
VALUES (generate_series(10, 10000));
2.收集表统计信息
-- Show the page and tuple counts currently stored in pg_class for the table.
-- The lookup is restricted to the tpcds schema so that a same-named relation
-- in another schema cannot appear in the result.
SELECT
    c.relname,
    c.relpages,
    c.reltuples
FROM pg_class AS c
INNER JOIN pg_namespace AS n
    ON n.oid = c.relnamespace
WHERE n.nspname = 'tpcds'
  AND c.relname = 'customer_address';

-- Refresh the statistics with ANALYZE; VERBOSE also prints information about
-- the table while it runs.
ANALYZE VERBOSE tpcds.customer_address;

-- Read the same catalog row again to see the values after ANALYZE.
SELECT
    c.relname,
    c.relpages,
    c.reltuples
FROM pg_class AS c
INNER JOIN pg_namespace AS n
    ON n.oid = c.relnamespace
WHERE n.nspname = 'tpcds'
  AND c.relname = 'customer_address';
3.打印执行计划
-- Use the default plan output format.
SET explain_perf_mode = normal;

-- Execution plan of a simple query over the whole table.
EXPLAIN SELECT * FROM tpcds.customer_address;

-- Execution plan rendered as JSON (when explain_perf_mode is normal).
EXPLAIN (FORMAT JSON) SELECT * FROM tpcds.customer_address;

-- Execution plan with cost estimates suppressed.
EXPLAIN (COSTS FALSE) SELECT * FROM tpcds.customer_address;

-- Execution plan of a query that uses an aggregate function.
EXPLAIN
SELECT SUM(ca_address_sk)
FROM tpcds.customer_address
WHERE ca_address_sk < 100;

-- Execution plan of a query whose predicate is on an indexed column:
-- create the index first, then explain the filtered query.
CREATE INDEX customer_address_idx ON tpcds.customer_address (ca_address_sk);
EXPLAIN SELECT * FROM tpcds.customer_address WHERE ca_address_sk < 100;
4.垃圾收集
-- VACUUM reclaims the storage occupied by deleted rows in a table or B-Tree
-- index. Rows with ca_address_sk below 100 are updated first, then VACUUM is
-- run with the VERBOSE and ANALYZE options.
UPDATE tpcds.customer_address
SET ca_address_sk = ca_address_sk + 1
WHERE ca_address_sk < 100;

VACUUM (VERBOSE, ANALYZE) tpcds.customer_address;
5.事务日志检查点
-- 检查点(CHECKPOINT)是一个事务日志中的点,所有数据文件都在该点被更新以反映日志中的信息,所有数据文件都将被刷新到磁盘
CHECKPOINT;
6.清理数据
-- Remove the tpcds schema; CASCADE also drops the objects it contains.
DROP SCHEMA tpcds CASCADE;
课后作业
1.创建分区表,并用generate_series(1,N)函数对表插入数据
-- Schema that holds the homework table.
CREATE SCHEMA tpcds;

-- Range-partitioned table keyed on c_id. Partition upper bounds are placed
-- every 20000 up to 100000; chenyq_p6 (MAXVALUE) takes every c_id >= 100000.
CREATE TABLE tpcds.chenyq (
    c_id       INTEGER     NOT NULL,
    c_name     VARCHAR(20),
    c_type     CHAR(15),
    c_city     VARCHAR(50),
    c_state    CHAR(5),
    c_location CHAR(50)
)
PARTITION BY RANGE (c_id) (
    PARTITION chenyq_p1 VALUES LESS THAN (20000),
    PARTITION chenyq_p2 VALUES LESS THAN (40000),
    PARTITION chenyq_p3 VALUES LESS THAN (60000),
    PARTITION chenyq_p4 VALUES LESS THAN (80000),
    PARTITION chenyq_p5 VALUES LESS THAN (100000),
    PARTITION chenyq_p6 VALUES LESS THAN (MAXVALUE)
);

-- Load one row per integer in 1..100000 via generate_series. Only c_id is
-- supplied, so the remaining columns are NULL.
INSERT INTO tpcds.chenyq (c_id)
VALUES (generate_series(1, 100000));
2.收集表统计信息
-- Show the page and tuple counts stored in pg_class before ANALYZE. The
-- lookup is restricted to the tpcds schema so that a same-named relation in
-- another schema cannot appear in the result.
SELECT
    c.relname,
    c.relpages,
    c.reltuples
FROM pg_class AS c
INNER JOIN pg_namespace AS n
    ON n.oid = c.relnamespace
WHERE n.nspname = 'tpcds'
  AND c.relname = 'chenyq';

-- Refresh the statistics; VERBOSE also prints information while it runs.
ANALYZE VERBOSE tpcds.chenyq;

-- Read the same catalog row again to see the values after ANALYZE.
SELECT
    c.relname,
    c.relpages,
    c.reltuples
FROM pg_class AS c
INNER JOIN pg_namespace AS n
    ON n.oid = c.relnamespace
WHERE n.nspname = 'tpcds'
  AND c.relname = 'chenyq';
3.显示简单查询的执行计划;建立索引并显示有索引条件的执行计划
-- Execution plan of a simple query over the whole table.
EXPLAIN SELECT * FROM tpcds.chenyq;

-- Index c_id, then show the plan of a query that filters on that column.
CREATE INDEX chenyq_idx ON tpcds.chenyq (c_id);
EXPLAIN SELECT * FROM tpcds.chenyq WHERE c_id < 1000;
4.更新表数据,并做垃圾收集
-- Shift every c_id below 10000 up by 5. The new values stay below 20000, the
-- upper bound of chenyq_p1, so the rows remain in that partition's range.
UPDATE tpcds.chenyq
SET c_id = c_id + 5
WHERE c_id < 10000;

-- Run VACUUM with the VERBOSE and ANALYZE options on the table.
VACUUM (VERBOSE, ANALYZE) tpcds.chenyq;
5.清理数据
-- Remove the tpcds schema; CASCADE also drops the objects it contains.
DROP SCHEMA tpcds CASCADE;
最后修改时间:2022-09-08 10:09:25
「喜欢这篇文章,您的关注和赞赏是给作者最好的鼓励」
关注作者
【版权声明】本文为墨天轮用户原创内容,转载时必须标注文章的来源(墨天轮),文章链接,文章作者等基本信息,否则作者和墨天轮有权追究责任。如果您发现墨天轮中有涉嫌抄袭或者侵权的内容,欢迎发送邮件至:contact@modb.pro进行举报,并提供相关证据,一经查实,墨天轮将立刻删除相关内容。













