转载:postgresql分区与优化

时间:2021-03-30 01:32:38
--对于分区表constraint_exclusion 这个参数需要配置为partition或on
postgres=# show constraint_exclusion ;
constraint_exclusion
----------------------
partition --创建父子表, 用于存储分区数据
create table t(id int primary key);
create table t1(like t including all) inherits(t);
create table t2(like t including all) inherits(t);
create table t3(like t including all) inherits(t);
create table t4(like t including all) inherits(t);
--PostgreSQL的子表和子表之间的约束是没有任何关系的, 所以也可以有重叠, 即非全局约束.
alter table t1 add constraint ck_t1_1 check(id<0);
alter table t2 add constraint ck_t2_1 check(id>=0 and id<100);
alter table t3 add constraint ck_t3_1 check(id>=100 and id<200);
alter table t4 add constraint ck_t4_1 check(id>=200); --分区字段传入常量, 执行时扫描的是父表和约束对应的子表 :
postgres=# explain select * from t where id=10;
QUERY PLAN
-----------------------------------------------------------------------------
Append (cost=0.00..8.17 rows=2 width=4)
-> Seq Scan on t (cost=0.00..0.00 rows=1 width=4)
Filter: (id = 10)
-> Index Only Scan using t2_pkey on t2 (cost=0.15..8.17 rows=1 width=4)
Index Cond: (id = 10)
(5 rows) --分区字段传入常量, 执行时扫描的是父表和约束对应的子表;
postgres=# prepare p_test as select * from t where id=$1;
PREPARE
postgres=# explain execute p_test(1);
QUERY PLAN
-----------------------------------------------------------------------------
Append (cost=0.00..8.17 rows=2 width=4)
-> Seq Scan on t (cost=0.00..0.00 rows=1 width=4)
Filter: (id = 1)
-> Index Only Scan using t2_pkey on t2 (cost=0.15..8.17 rows=1 width=4)
Index Cond: (id = 1)
(5 rows) --子句查询, 执行时扫描的是父表和所有子表, 注意这里使用的子查询是子表的查询, 理论上应该是扫描父表和该子表
postgres=# explain select * from t where id=(select id from t1 limit 1);
QUERY PLAN
-----------------------------------------------------------------------------
Append (cost=0.01..32.70 rows=5 width=4)
InitPlan 1 (returns $0)
-> Limit (cost=0.00..0.01 rows=1 width=4)
-> Seq Scan on t1 t1_1 (cost=0.00..34.00 rows=2400 width=4)
-> Seq Scan on t (cost=0.00..0.00 rows=1 width=4)
Filter: (id = $0)
-> Index Only Scan using t1_pkey on t1 (cost=0.15..8.17 rows=1 width=4)
Index Cond: (id = $0)
-> Index Only Scan using t2_pkey on t2 (cost=0.15..8.17 rows=1 width=4)
Index Cond: (id = $0)
-> Index Only Scan using t3_pkey on t3 (cost=0.15..8.17 rows=1 width=4)
Index Cond: (id = $0)
-> Index Only Scan using t4_pkey on t4 (cost=0.15..8.17 rows=1 width=4)
Index Cond: (id = $0)
(14 rows) --综上可知在对分区表进行查询时最好使用字面常量,而不要使用子查询之类复杂的sql --如果子表上约束删除,则pg不得不把删除约束的子表也加入到查询中(即使子表可以忽略)
alter table t4 drop constraint ck_t4_1;
postgres=# explain select * from t where id=10;
QUERY PLAN
-----------------------------------------------------------------------------
Append (cost=0.00..16.34 rows=3 width=4)
-> Seq Scan on t (cost=0.00..0.00 rows=1 width=4)
Filter: (id = 10)
-> Index Only Scan using t2_pkey on t2 (cost=0.15..8.17 rows=1 width=4)
Index Cond: (id = 10)
-> Index Only Scan using t4_pkey on t4 (cost=0.15..8.17 rows=1 width=4)
Index Cond: (id = 10)
(7 rows) --如果constraint_exclusion设置为off,pg不得不进行全表扫描
postgres=# set constraint_exclusion=off;
SET
postgres=# explain select * from t where id=10;
QUERY PLAN
-----------------------------------------------------------------------------
Append (cost=0.00..32.69 rows=5 width=4)
-> Seq Scan on t (cost=0.00..0.00 rows=1 width=4)
Filter: (id = 10)
-> Index Only Scan using t1_pkey on t1 (cost=0.15..8.17 rows=1 width=4)
Index Cond: (id = 10)
-> Index Only Scan using t2_pkey on t2 (cost=0.15..8.17 rows=1 width=4)
Index Cond: (id = 10)
-> Index Only Scan using t3_pkey on t3 (cost=0.15..8.17 rows=1 width=4)
Index Cond: (id = 10)
-> Index Only Scan using t4_pkey on t4 (cost=0.15..8.17 rows=1 width=4)
Index Cond: (id = 10)
(11 rows) --分区表上一般针对分区建立相对应的分区索引
--建在父表的索引为全局索引,但如果你表没有数据要查询子表时,则分区表要进行全表扫描 --父表建立的全局索引
postgres=# \d+ p
Table "public.p"
Column | Type | Modifiers | Storage | Stats target | Description
-----------+--------------------------------+-----------+---------+--------------+-------------
city_id | integer | not null | plain | |
logtime | timestamp(0) without time zone | not null | plain | |
peaktemp | integer | | plain | |
unitsales | integer | | plain | |
Indexes:
"idx_city_id" btree (city_id)
"idx_p_logtime" btree (logtime)
Triggers:
delete_p_trigger BEFORE DELETE ON p FOR EACH ROW EXECUTE PROCEDURE p_delete_trigger()
insert_p_trigger BEFORE INSERT ON p FOR EACH ROW EXECUTE PROCEDURE p_insert_trigger()
Child tables: p_201201,
p_201202,
p_201203,
p_201204,
p_201205,
p_201206,
p_201207,
p_201208,
p_201209,
p_201210,
p_201211,
p_201212,
p_default
Has OIDs: no --分区没有索引,不能使用父表索引
postgres=# explain select * from p_201202 where city_id=2 and logtime=timestamp '2012-02-02 12:59:59';
QUERY PLAN
----------------------------------------------------------------------------------------------
Seq Scan on p_201202 (cost=0.00..214.01 rows=2 width=20)
Filter: ((city_id = 2) AND (logtime = '2012-02-02 12:59:59'::timestamp without time zone))
(2 rows) --建立分区索引,可以使用分区索引
postgres=# CREATE INDEX idx_p_201202_city_id ON p_201202 (city_id);
CREATE INDEX
postgres=# explain select * from p_201202 where city_id=2 and logtime=timestamp '2012-02-02 12:59:59';
QUERY PLAN
--------------------------------------------------------------------------------------
Index Scan using idx_p_201202_city_id on p_201202 (cost=0.29..8.33 rows=2 width=20)
Index Cond: (city_id = 2)
Filter: (logtime = '2012-02-02 12:59:59'::timestamp without time zone) --也可以指定只查询父表的数据 postgres=# select * from only p;
city_id | logtime | peaktemp | unitsales
---------+---------+----------+-----------
(0 rows) --如果一个分区表,父子表之间不再有继承关系,则查询父表时不再过滤到子表
postgres=# alter table t3 no inherit t;
ALTER TABLE
postgres=# explain select count(*) from t;
QUERY PLAN
------------------------------------------------------------------
Aggregate (cost=73.50..73.51 rows=1 width=0)
-> Append (cost=0.00..62.80 rows=4281 width=0)
-> Seq Scan on t (cost=0.00..0.00 rows=1 width=0)
-> Seq Scan on t1 (cost=0.00..31.40 rows=2140 width=0)
-> Seq Scan on t2 (cost=0.00..31.40 rows=2140 width=0)
(5 rows) --再次添加继承,查询父表可以过滤到子表
postgres=# alter table t3 inherit t;
ALTER TABLE
postgres=# explain select count(*) from t;
QUERY PLAN
------------------------------------------------------------------
Aggregate (cost=110.25..110.26 rows=1 width=0)
-> Append (cost=0.00..94.20 rows=6421 width=0)
-> Seq Scan on t (cost=0.00..0.00 rows=1 width=0)
-> Seq Scan on t1 (cost=0.00..31.40 rows=2140 width=0)
-> Seq Scan on t2 (cost=0.00..31.40 rows=2140 width=0)
-> Seq Scan on t3 (cost=0.00..31.40 rows=2140 width=0)
(6 rows) --以下为p表测试数据代码
CREATE TABLE p (
city_id int not null,
logtime timestamp(0) not null,
peaktemp int,
unitsales int
); CREATE INDEX idx_p_logtime ON p (logtime); CREATE TABLE p_201201 (LIKE p INCLUDING all) INHERITS (p);
CREATE TABLE p_201202 (LIKE p INCLUDING all) INHERITS (p);
CREATE TABLE p_201203 (LIKE p INCLUDING all) INHERITS (p);
CREATE TABLE p_201204 (LIKE p INCLUDING all) INHERITS (p);
CREATE TABLE p_201205 (LIKE p INCLUDING all) INHERITS (p);
CREATE TABLE p_201206 (LIKE p INCLUDING all) INHERITS (p);
CREATE TABLE p_201207 (LIKE p INCLUDING all) INHERITS (p);
CREATE TABLE p_201208 (LIKE p INCLUDING all) INHERITS (p);
CREATE TABLE p_201209 (LIKE p INCLUDING all) INHERITS (p);
CREATE TABLE p_201210 (LIKE p INCLUDING all) INHERITS (p);
CREATE TABLE p_201211 (LIKE p INCLUDING all) INHERITS (p);
CREATE TABLE p_201212 (LIKE p INCLUDING all) INHERITS (p);
CREATE TABLE p_default (LIKE p INCLUDING all) INHERITS (p); CREATE OR REPLACE FUNCTION p_insert_trigger()
RETURNS TRIGGER AS $$
BEGIN
IF ( NEW.logtime >= DATE '2012-01-01' AND NEW.logtime < DATE '2012-02-01' ) THEN
INSERT INTO p_201201 VALUES (NEW.*);
ELSIF ( NEW.logtime >= DATE '2012-02-01' AND NEW.logtime < DATE '2012-03-01' ) THEN
INSERT INTO p_201202 VALUES (NEW.*);
ELSIF ( NEW.logtime >= DATE '2012-03-01' AND NEW.logtime < DATE '2012-04-01' ) THEN
INSERT INTO p_201203 VALUES (NEW.*);
ELSIF ( NEW.logtime >= DATE '2012-04-01' AND NEW.logtime < DATE '2012-05-01' ) THEN
INSERT INTO p_201204 VALUES (NEW.*);
ELSIF ( NEW.logtime >= DATE '2012-05-01' AND NEW.logtime < DATE '2012-06-01' ) THEN
INSERT INTO p_201205 VALUES (NEW.*);
ELSIF ( NEW.logtime >= DATE '2012-06-01' AND NEW.logtime < DATE '2012-07-01' ) THEN
INSERT INTO p_201206 VALUES (NEW.*);
ELSIF ( NEW.logtime >= DATE '2012-07-01' AND NEW.logtime < DATE '2012-08-01' ) THEN
INSERT INTO p_201207 VALUES (NEW.*);
ELSIF ( NEW.logtime >= DATE '2012-08-01' AND NEW.logtime < DATE '2012-09-01' ) THEN
INSERT INTO p_201208 VALUES (NEW.*);
ELSIF ( NEW.logtime >= DATE '2012-09-01' AND NEW.logtime < DATE '2012-10-01' ) THEN
INSERT INTO p_201209 VALUES (NEW.*);
ELSIF ( NEW.logtime >= DATE '2012-10-01' AND NEW.logtime < DATE '2012-11-01' ) THEN
INSERT INTO p_201210 VALUES (NEW.*);
ELSIF ( NEW.logtime >= DATE '2012-11-01' AND NEW.logtime < DATE '2012-12-01' ) THEN
INSERT INTO p_201211 VALUES (NEW.*);
ELSIF ( NEW.logtime >= DATE '2012-12-01' AND NEW.logtime < DATE '2013-01-01' ) THEN
INSERT INTO p_201212 VALUES (NEW.*);
ELSIF ( NEW.logtime >= DATE '2013-01-01' OR NEW.logtime < DATE '2012-01-01' ) THEN
INSERT INTO p_default VALUES (NEW.*);
ELSE
RAISE EXCEPTION 'Date out of range. Fix the p_insert_trigger() function!';
END IF;
RETURN NULL;
END;
$$ LANGUAGE plpgsql; CREATE OR REPLACE FUNCTION p_delete_trigger()
RETURNS TRIGGER AS $$
BEGIN
IF ( OLD.logtime >= DATE '2012-01-01' AND OLD.logtime < DATE '2012-02-01' ) THEN
DELETE FROM p_201201 WHERE logtime=OLD.logtime;
ELSIF ( OLD.logtime >= DATE '2012-02-01' AND OLD.logtime < DATE '2012-03-01' ) THEN
DELETE FROM p_201202 WHERE logtime=OLD.logtime;
ELSIF ( OLD.logtime >= DATE '2012-03-01' AND OLD.logtime < DATE '2012-04-01' ) THEN
DELETE FROM p_201203 WHERE logtime=OLD.logtime;
ELSIF ( OLD.logtime >= DATE '2012-04-01' AND OLD.logtime < DATE '2012-05-01' ) THEN
DELETE FROM p_201204 WHERE logtime=OLD.logtime;
ELSIF ( OLD.logtime >= DATE '2012-05-01' AND OLD.logtime < DATE '2012-06-01' ) THEN
DELETE FROM p_201205 WHERE logtime=OLD.logtime;
ELSIF ( OLD.logtime >= DATE '2012-06-01' AND OLD.logtime < DATE '2012-07-01' ) THEN
DELETE FROM p_201206 WHERE logtime=OLD.logtime;
ELSIF ( OLD.logtime >= DATE '2012-07-01' AND OLD.logtime < DATE '2012-08-01' ) THEN
DELETE FROM p_201207 WHERE logtime=OLD.logtime;
ELSIF ( OLD.logtime >= DATE '2012-08-01' AND OLD.logtime < DATE '2012-09-01' ) THEN
DELETE FROM p_201208 WHERE logtime=OLD.logtime;
ELSIF ( OLD.logtime >= DATE '2012-09-01' AND OLD.logtime < DATE '2012-10-01' ) THEN
DELETE FROM p_201209 WHERE logtime=OLD.logtime;
ELSIF ( OLD.logtime >= DATE '2012-10-01' AND OLD.logtime < DATE '2012-11-01' ) THEN
DELETE FROM p_201210 WHERE logtime=OLD.logtime;
ELSIF ( OLD.logtime >= DATE '2012-11-01' AND OLD.logtime < DATE '2012-12-01' ) THEN
DELETE FROM p_201211 WHERE logtime=OLD.logtime;
ELSIF ( OLD.logtime >= DATE '2012-12-01' AND OLD.logtime < DATE '2013-01-01' ) THEN
DELETE FROM p_201212 WHERE logtime=OLD.logtime;
ELSIF ( OLD.logtime >= DATE '2013-01-01' OR OLD.logtime < DATE '2012-01-01' ) THEN
DELETE FROM p_default WHERE logtime=OLD.logtime;
ELSE
RAISE EXCEPTION 'Date out of range. Fix the p_insert_trigger() function!';
END IF;
RETURN NULL;
END;
$$ LANGUAGE plpgsql; CREATE TRIGGER insert_p_trigger
BEFORE INSERT ON p
FOR EACH ROW EXECUTE PROCEDURE p_insert_trigger(); CREATE TRIGGER delete_p_trigger
BEFORE DELETE ON p
FOR EACH ROW EXECUTE PROCEDURE p_delete_trigger(); INSERT INTO p (city_id, logtime, peaktemp, unitsales) VALUES (1, timestamp '2012-01-02 12:59:59', 20, 10);
INSERT INTO p (city_id, logtime, peaktemp, unitsales) VALUES (2, timestamp '2012-02-02 12:59:59', 20, 10);
INSERT INTO p (city_id, logtime, peaktemp, unitsales) VALUES (3, timestamp '2012-03-02 12:59:59', 20, 10);
INSERT INTO p (city_id, logtime, peaktemp, unitsales) VALUES (4, timestamp '2012-04-02 12:59:59', 20, 10);
INSERT INTO p (city_id, logtime, peaktemp, unitsales) VALUES (5, timestamp '2012-05-02 12:59:59', 20, 10);
INSERT INTO p (city_id, logtime, peaktemp, unitsales) VALUES (6, timestamp '2012-06-02 12:59:59', 20, 10);
INSERT INTO p (city_id, logtime, peaktemp, unitsales) VALUES (7, timestamp '2012-07-02 12:59:59', 20, 10);
INSERT INTO p (city_id, logtime, peaktemp, unitsales) VALUES (8, timestamp '2012-08-02 12:59:59', 20, 10);
INSERT INTO p (city_id, logtime, peaktemp, unitsales) VALUES (9, timestamp '2012-09-02 12:59:59', 20, 10);
INSERT INTO p (city_id, logtime, peaktemp, unitsales) VALUES (10, timestamp '2012-10-02 12:59:59', 20, 10);
INSERT INTO p (city_id, logtime, peaktemp, unitsales) VALUES (11, timestamp '2012-11-02 12:59:59', 20, 10);
INSERT INTO p (city_id, logtime, peaktemp, unitsales) VALUES (12, timestamp '2012-12-02 12:59:59', 20, 10);
INSERT INTO p (city_id, logtime, peaktemp, unitsales) VALUES (13, timestamp '2013-01-02 12:59:59', 20, 10);
INSERT INTO p (city_id, logtime, peaktemp, unitsales) VALUES (14, timestamp '2011-12-02 12:59:59', 20, 10); INSERT INTO p (city_id, logtime, peaktemp, unitsales) select m, timestamp '2012-02-02 12:59:59', 20, 10 from generate_series(1,10000) m; explain select * from p_201202 where city_id=2 and logtime=timestamp '2012-02-02 12:59:59';
转载:https://yq.aliyun.com/articles/2637?spm=5176.100240.searchblog.12.59Jibq#

转载:postgresql分区与优化的更多相关文章

  1. PostgreSQL之性能优化(转)

    转载自:https://blog.csdn.net/huangwenyi1010/article/details/72853785 解决问题 前言 PostgreSQL的配置参数作为性能调优的一部分, ...

  2. PostgreSQL 分区索引演进

    PostgreSQL 分区表,操作性相当便捷. 但只能在创建时决定是否为分区表,并决定分区条件字段,普通表创建后,不能在修改为分区表. Note:通过其他方法也可转化为分区表. 和其他数据库一样,分区 ...

  3. 【转载】PHP性能优化干货

    PHP优化对于PHP的优化主要是对php.ini中的相关主要参数进行合理调整和设置,以下我们就来看看php.ini中的一些对性能影响较大的参数应该如何设置. # vi /etc/php.ini (1) ...

  4. 【转载】 Spark性能优化指南——基础篇

    转自:http://tech.meituan.com/spark-tuning-basic.html?from=timeline 前言 开发调优 调优概述 原则一:避免创建重复的RDD 原则二:尽可能 ...

  5. 【转载】MySQL性能优化的最佳20&plus;条经验

    今天,数据库的操作越来越成为整个应用的性能瓶颈了,这点对于Web应用尤其明显.关于数据库的性能,这并不只是DBA才需要担心的事,而这更是我们程序员需要去关注的事情.当我们去设计数据库表结构,对操作数据 ...

  6. &lbrack;转载&rsqb;U3d常规性能优化技巧

    以下技巧并不是必须的,但是对于想要提升游戏性能的人来说应该还是很不错的. 优化的常规技巧 n 剖析你的游戏. 不要花费时间来优化那些晦涩的代码或者缩减图形文件的大小,除非这是你游戏的瓶颈.第一次剖析你 ...

  7. 转载 50种方法优化SQL Server数据库查询

    原文地址 http://www.cnblogs.com/zhycyq/articles/2636748.html 50种方法优化SQL Server数据库查询 查询速度慢的原因很多,常见如下几种: 1 ...

  8. 【转载】 Spark性能优化:资源调优篇

    在开发完Spark作业之后,就该为作业配置合适的资源了.Spark的资源参数,基本都可以在spark-submit命令中作为参数设置.很多Spark初学者,通常不知道该设置哪些必要的参数,以及如何设置 ...

  9. PostgreSQL查询优化逻辑优化之其他

    上一节我们介绍了PostgreSQL的子查询优化,子查询优化把一部分可以优化的子查询上拉到主查询成为join. preprocess_expression 将表达式(目标列,where,join,ha ...

随机推荐

  1. Redis 学习笔记(C&num;)

    Redis安装及简单操作 Windows下安装步骤: 1. 第一步当然是先下载咯~  地址:https://github.com/dmajkic/redis/downloads (根据自己实际情况选择 ...

  2. Hibernate SQL优化技巧dynamic-insert&equals;&quot&semi;true&quot&semi; dynamic-update&equals;&quot&semi;true&quot&semi;

    最近正在拜读Hibernate之父大作<Java Persistence with Hibernate>,颇有收获.在我们熟悉的Hibernate映射文件中也大有乾坤,很多值得我注意的地方 ...

  3. (转载)链表环中的入口点 编程之美 leecode 学习

    http://www.cnblogs.com/hiddenfox/p/3408931.html 说的很细 /** * Definition for singly-linked list. * clas ...

  4. Altium Designer10 如何导出Gerber文件

    版本:AD10.818 目的:Gerber文件导出备忘 http://blog.sina.com.cn/s/blog_9b9a51990100zyyv.html 目录: Step1:设置原点 Step ...

  5. Ps 美白磨皮【1】

      方法一:去色加图层模式法 打开需要编辑的图片,按Ctrl+J复制新的图层1. 点击菜单栏“图像”-“调整”-“去色”,如下图所示. 将图层面板的混合模式更改为“滤色”,如下图4所示. 最后的显示效 ...

  6. Java之线程的生命周期

    在Java中,线程有5中不同状态,分别是:新建(New).就绪(Runable).运行(Running).阻塞(Blocked)和死亡(Dead).它们之间的转换图如下: 上图有一个例外,调用yiel ...

  7. J2EE

    随笔分类 - J2EE   关于SpringMVC Json使用 摘要: 很简单的一个东西,这里就不做过多介绍了,写一个小Demo,随手记录下.首先,在搭好SpringMVC工程环境之后,如果想用Sp ...

  8. public,private,protected,以及不写时的差别

    作用域public,private.protected.以及不写时的差别 这四个作用域的可见范围例如以下表所看到的. 说明:假设在修饰的元素上面没有写不论什么訪问修饰符,则表示friendly.不使用 ...

  9. 关于block的循环引用的问题

    在block的循环引用的问题上我们都知道如果在block内部修改外部的变量的时候,要加__block以防止循环引用的问题,但是如果block是当前对象的一个属性的时候,要修改当前对象的一个属性的时候就 ...

  10. 从零开始学习PYTHON3讲义(十六)(连载完)学习资源包下载

    <从零开始PYTHON3>学习资源包下载 课程连载已经完全结束. 经过整理校对,这里把在课程中出现过的源码和练习答案示例源码全部打包提供下载: https://pan.baidu.com/ ...