基于patroni+etcd的postgresql高可用搭建

姬向明

2023-12-01

1.环境

centos 7.4

postgresql 10.5

物理ip

192.168.199.240 （node1）

192.168.199.241 （node2）

192.168.199.242 （node3）

vip

192.168.199.248

192.168.199.249

2.安装patroni和ectd

yum install -y gcc python-devel epel-release
yum install -y etcd
yum install -y python2-pip
pip install --upgrade setuptools
pip install psycopg2-binary
pip install python-etcd
pip install patroni
3.配置etcd文件

node1
vi /etc/etcd/etcd.conf

ETCD_DATA_DIR="/var/lib/etcd/node1.etcd"
ETCD_LISTEN_PEER_URLS="http://192.168.199.240:2380,http://127.0.0.1:2380"
ETCD_LISTEN_CLIENT_URLS="http://192.168.199.240:2379,http://127.0.0.1:2379"
ETCD_NAME="node1"
ETCD_INITIAL_ADVERTISE_PEER_URLS="http://192.168.199.240:2380"
ETCD_ADVERTISE_CLIENT_URLS="http://192.168.199.240:2379"
ETCD_INITIAL_CLUSTER="node1=http://192.168.199.240:2380,node2=http://192.168.199.241:2380,node3=http://192.168.199.242:2380"
ETCD_INITIAL_CLUSTER_TOKEN="etcd-cluster"
ETCD_INITIAL_CLUSTER_STATE="new"
node2
vi /etc/etcd/etcd.conf

ETCD_DATA_DIR="/var/lib/etcd/node2.etcd"
ETCD_LISTEN_PEER_URLS="http://192.168.199.241:2380,http://127.0.0.1:2380"
ETCD_LISTEN_CLIENT_URLS="http://192.168.199.241:2379,http://127.0.0.1:2379"
ETCD_NAME="node2"
ETCD_INITIAL_ADVERTISE_PEER_URLS="http://192.168.199.241:2380"
ETCD_ADVERTISE_CLIENT_URLS="http://192.168.199.241:2379"
ETCD_INITIAL_CLUSTER="node1=http://192.168.199.240:2380,node2=http://192.168.199.241:2380,node3=http://192.168.199.242:2380"
ETCD_INITIAL_CLUSTER_TOKEN="etcd-cluster"
ETCD_INITIAL_CLUSTER_STATE="new"
node3
vi /etc/etcd/etcd.conf

ETCD_DATA_DIR="/var/lib/etcd/node3.etcd"
ETCD_LISTEN_PEER_URLS="http://192.168.199.242:2380,http://127.0.0.1:2380"
ETCD_LISTEN_CLIENT_URLS="http://192.168.199.242:2379,http://127.0.0.1:2379"
ETCD_NAME="node3"
ETCD_INITIAL_ADVERTISE_PEER_URLS="http://192.168.199.242:2380"
ETCD_ADVERTISE_CLIENT_URLS="http://192.168.199.242:2379"
ETCD_INITIAL_CLUSTER="node1=http://192.168.199.240:2380,node2=http://192.168.199.241:2380,node3=http://192.168.199.242:2380"
ETCD_INITIAL_CLUSTER_TOKEN="etcd-cluster"
ETCD_INITIAL_CLUSTER_STATE="new"
4.安装postgresql

pg数据库参数配置
node1
postgresql.conf

max_connections = '100'
max_wal_senders = '10'
port = '5432'
listen_addresses = '0.0.0.0'
synchronous_commit = on
full_page_writes = on
wal_log_hints = on
synchronous_standby_names = '*'
max_replication_slots = 10
wal_level = replica

node1
pg_hba.conf

host all all 192.168.99.0/24 md5
host replication replicator 192.168.199.240/32 md5
host replication replicator 192.168.199.240/32 md5
host replication replicator 192.168.199.240/32 md5

创建流复制的用户，创建复制槽
create user replicator replication login encrypted password 'replicator';
alter user postgres with password 'postgres';
select * from pg_create_physical_replication_slot('pg10_node1');
select * from pg_create_physical_replication_slot('pg10_node2');
select * from pg_create_physical_replication_slot('pg10_node3');

node2

pg_basebackup -h 192.168.199.240 -D /opt/data -U replicator -v -P -R

vi recovery.conf
recovery_target_timeline = 'latest'
standby_mode = 'on'
primary_conninfo = 'host=192.168.199.240 port=5432 user=replicator password=replicator'
primary_slot_name = 'pg10_node2'
trigger_file = '/tmp/postgresql.trigger.5432'

node3
pg_basebackup -h 192.168.199.240 -D /opt/data -U replicator -v -P -R

vi recovery.conf
recovery_target_timeline = 'latest'
standby_mode = 'on'
primary_conninfo = 'host=192.168.199.240 port=5432 user=replicator password=replicator'
primary_slot_name = 'pg10_node3'
trigger_file = '/tmp/postgresql.trigger.5432'
5.配置patroni文件

vi /usr/patroni/conf/patroni_postgresql.yml

node1

scope: pg10
namespace: /pgsql/
name: pg10_node1

restapi:
listen: 192.168.199.240:8008
connect_address: 192.168.199.240:8008

etcd:
host: 192.168.199.240:2379

bootstrap:
# this section will be written into Etcd:/<namespace>/<scope>/config after initializing new cluster
# and all other cluster members will use it as a `global configuration`
dcs:
ttl: 30
loop_wait: 10
retry_timeout: 10
maximum_lag_on_failover: 1048576
master_start_timeout: 300
synchronous_mode: false
postgresql:
use_pg_rewind: true
use_slots: true
parameters:
listen_addresses: "0.0.0.0"
port: 5432
wal_level: logical
hot_standby: "on"
wal_keep_segments: 1000
max_wal_senders: 10
max_replication_slots: 10
wal_log_hints: "on"
# archive_mode: "on"
# archive_timeout: 1800s
# archive_command: gzip < %p > /data/backup/pgwalarchive/%f.gz
# recovery_conf:
# restore_command: gunzip < /data/backup/pgwalarchive/%f.gz > %p

postgresql:
listen: 0.0.0.0:5432
connect_address: 192.168.199.240:5432
data_dir: /opt/data
bin_dir: /opt/pg10/bin
# config_dir: /etc/postgresql/9.6/main
authentication:
replication:
username: replicator
password: replicator
superuser:
username: postgres
password: postgres

#watchdog:
# mode: automatic # Allowed values: off, automatic, required
# device: /dev/watchdog
# safety_margin: 5

tags:
nofailover: false
noloadbalance: false
clonefrom: false
nosync: false
node2

scope: pg10
namespace: /pgsql/
name: pg10_node2

restapi:
listen: 192.168.199.241:8008
connect_address: 192.168.199.241:8008

etcd:
host: 192.168.199.241:2379

bootstrap:
# this section will be written into Etcd:/<namespace>/<scope>/config after initializing new cluster
# and all other cluster members will use it as a `global configuration`
dcs:
ttl: 30
loop_wait: 10
retry_timeout: 10
maximum_lag_on_failover: 1048576
master_start_timeout: 300
synchronous_mode: false
postgresql:
use_pg_rewind: true
use_slots: true
parameters:
listen_addresses: "0.0.0.0"
port: 5432
wal_level: logical
hot_standby: "on"
wal_keep_segments: 1000
max_wal_senders: 10
max_replication_slots: 10
wal_log_hints: "on"
# archive_mode: "on"
# archive_timeout: 1800s
# archive_command: gzip < %p > /data/backup/pgwalarchive/%f.gz
# recovery_conf:
# restore_command: gunzip < /data/backup/pgwalarchive/%f.gz > %p

postgresql:
listen: 0.0.0.0:5432
connect_address: 192.168.199.241:5432
data_dir: /opt/data
bin_dir: /pg10/postgres10/bin
# config_dir: /etc/postgresql/9.6/main
authentication:
replication:
username: replicator
password: replicator
superuser:
username: postgres
password: postgres

#watchdog:
# mode: automatic # Allowed values: off, automatic, required
# device: /dev/watchdog
# safety_margin: 5

tags:
nofailover: false
noloadbalance: false
clonefrom: false
nosync: false
node3

scope: pg10
namespace: /pgsql/
name: pg10_node3

restapi:
listen: 192.168.199.242:8008
connect_address: 192.168.199.242:8008

etcd:
host: 192.168.199.242:2379

bootstrap:
# this section will be written into Etcd:/<namespace>/<scope>/config after initializing new cluster
# and all other cluster members will use it as a `global configuration`
dcs:
ttl: 30
loop_wait: 10
retry_timeout: 10
maximum_lag_on_failover: 1048576
master_start_timeout: 300
synchronous_mode: false
postgresql:
use_pg_rewind: true
use_slots: true
parameters:
listen_addresses: "0.0.0.0"
port: 5432
wal_level: logical
hot_standby: "on"
wal_keep_segments: 1000
max_wal_senders: 10
max_replication_slots: 10
wal_log_hints: "on"
# archive_mode: "on"
# archive_timeout: 1800s
# archive_command: gzip < %p > /data/backup/pgwalarchive/%f.gz
# recovery_conf:
# restore_command: gunzip < /data/backup/pgwalarchive/%f.gz > %p

postgresql:
listen: 0.0.0.0:5432
connect_address: 192.168.199.242:5432
data_dir: /opt/data
bin_dir: /opt/pg10/bin
# config_dir: /etc/postgresql/9.6/main
authentication:
replication:
username: replicator
password: replicator
superuser:
username: postgres
password: postgres

#watchdog:
# mode: automatic # Allowed values: off, automatic, required
# device: /dev/watchdog
# safety_margin: 5

tags:
nofailover: false
noloadbalance: false
clonefrom: false
nosync: false
6.启动patroni

手动启动 patroni,注意这里需要切换到postgres用户下启动

node1、node2、node3 三个节点依次启动

[postgres@node1 ~]$patroni /usr/patroni/conf/patroni_postgresql.yml
查看集群信息

查看etcd状态

[root@node1 ~]# etcdctl ls /pgsql/pg10
/pgsql/pg10/leader
/pgsql/pg10/config
/pgsql/pg10/optime
/pgsql/pg10/members
/pgsql/pg10/initialize
为了方便开机自启，故配置成 patroni.service，3个node都需要进行配置，配置好patroni.service后就可以直接在root用户下切换Leader以及重启postgres节点等操作

[root@localhost data]# vi /etc/systemd/system/patroni.service
[root@localhost data]# cat /etc/systemd/system/patroni.service
[Unit]
Description=patroni - a high-availability PostgreSQL
Documentation=https://patroni.readthedocs.io/en/latest/index.html
After=syslog.target network.target etcd.target
Wants=network-online.target

[Service]
Type=simple
User=postgres
Group=postgres
PermissionsStartOnly=true
ExecStart=/usr/bin/patroni /usr/patroni/conf/patroni_postgresql.yml
ExecReload=/bin/kill -HUP $MAINPID
LimitNOFILE=65536
KillMode=process
KillSignal=SIGINT
Restart=on-abnormal
RestartSec=30s
TimeoutSec=0

[Install]
WantedBy=multi-user.target

7.常用命令

# 启动服务(会自动启动 pg 实例)
systemctl start patroni
# 关闭服务(会自动关闭 pg 实例)
systemctl stop patroni
# 查看集群状态
patronictl -c /etc/patroni.yml list
# 可以查看命令的使用说明
patronictl --help
# 查看版本号
patronictl -c /etc/patroni.yml version
# 查看所有成员信息
patronictl -c /etc/patroni.yml list
# 重新加载配置
patronictl -c /etc/patroni.yml reload
# 移除集群，重新配置的时候使用
patronictl -c /etc/patroni.yml remove postgres
# 重启数据库集群
patronictl -c /etc/patroni.yml restart postgres
# 切换 Leader，将一个 slave 切换成 leader。
patronictl -c /etc/patroni.yml switchover

参考：https://blog.csdn.net/andou2693/article/details/101549161/

https://mp.weixin.qq.com/s/edvWkTb-WF7YyVAFz5GCfw
https://blog.csdn.net/silenceray/article/details/116144139

基于patroni+etcd的postgresql高可用搭建

相关阅读

相关文章

相关问答

相关文档